{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 171,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "import nltk\n",
    "import jieba\n",
    "import jieba.posseg as pseg\n",
    "from nltk.tokenize import word_tokenize "
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 5.1 使用词性标注器"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "text = nltk.word_tokenize(\"And now for something completely different\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('And', 'CC'),\n",
       " ('now', 'RB'),\n",
       " ('for', 'IN'),\n",
       " ('something', 'NN'),\n",
       " ('completely', 'RB'),\n",
       " ('different', 'JJ')]"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "nltk.pos_tag(text)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [],
   "source": [
    "# pseg.cut() returns a one-shot generator; materialize it so the loop in the\n",
    "# next cell still prints the (word, flag) pairs when that cell is re-run.\n",
    "words = list(pseg.cut(\"我爱北京天安门\"))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "我 r\n",
      "爱 v\n",
      "北京 ns\n",
      "天安门 ns\n"
     ]
    }
   ],
   "source": [
    "for word, flag in words:\n",
    "    print('%s %s' % (word, flag))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "RB: adverb\n",
      "    occasionally unabatingly maddeningly adventurously professedly\n",
      "    stirringly prominently technologically magisterially predominately\n",
      "    swiftly fiscally pitilessly ...\n"
     ]
    }
   ],
   "source": [
    "nltk.help.upenn_tagset('RB')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "\"\"\"\n",
    "有时候句子里面可能会包括一些同形同音异义词\n",
    "他们拒绝授予我们 垃圾排放许可证  前两个都是动词，后两个是名词\n",
    "我们需要知道正在使用哪一个词以便能正确读课文。（出于这个原因，文本转\n",
    "语音系统通常要进行词性标注。）\n",
    "\"\"\"\n",
    "text = nltk.word_tokenize(\"They refuse to permit us to obtain the refuse permit\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('They', 'PRP'),\n",
       " ('refuse', 'VBP'),\n",
       " ('to', 'TO'),\n",
       " ('permit', 'VB'),\n",
       " ('us', 'PRP'),\n",
       " ('to', 'TO'),\n",
       " ('obtain', 'VB'),\n",
       " ('the', 'DT'),\n",
       " ('refuse', 'NN'),\n",
       " ('permit', 'NN')]"
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "nltk.pos_tag(text)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [],
   "source": [
    "# A bare nltk.download() opens the interactive downloader and waits for user\n",
    "# input, which stalls Restart & Run All. Fetch the required resources by\n",
    "# name instead.\n",
    "# NOTE(review): this list covers the corpora/models referenced in the part of\n",
    "# the notebook that was reviewed, using the resource ids of the NLTK release\n",
    "# the notebook was written for -- extend or rename entries if other cells or a\n",
    "# newer NLTK need different data.\n",
    "NLTK_RESOURCES = (\n",
    "    'punkt', 'averaged_perceptron_tagger', 'tagsets', 'universal_tagset',\n",
    "    'brown', 'nps_chat', 'conll2000', 'treebank', 'sinica_treebank', 'indian',\n",
    ")\n",
    "for resource in NLTK_RESOURCES:\n",
    "    nltk.download(resource, quiet=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "text = nltk.Text(word.lower() for word in nltk.corpus.brown.words())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<Text: the fulton county grand jury said friday an...>"
      ]
     },
     "execution_count": 25,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "text"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "man time day year car moment world house family child country boy\n",
      "state job place way war girl work word\n"
     ]
    }
   ],
   "source": [
    "text.similar('woman')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "made said done put had seen found given left heard was been brought\n",
      "set got that took in told felt\n"
     ]
    }
   ],
   "source": [
    "text.similar('bought')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "in on to of and for with from at by that into as up out down through\n",
      "is all about\n"
     ]
    }
   ],
   "source": [
    "text.similar('over')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "a his this their its her an that our any all one these my in your no\n",
      "some other and\n"
     ]
    }
   ],
   "source": [
    "text.similar('the')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 5.2 标注语料库"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "tagged_token = nltk.tag.str2tuple('fly/NN')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "('fly', 'NN')"
      ]
     },
     "execution_count": 32,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tagged_token"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "sent = '''\n",
    "    The/AT grand/JJ jury/NN commented/VBD on/IN a/AT number/NN of/IN\n",
    "    other/AP topics/NNS ,/, AMONG/IN them/PPO the/AT Atlanta/NP and/CC\n",
    "    Fulton/NP-tl County/NN-tl purchasing/VBG departments/NNS which/WDT it/PPS\n",
    "    said/VBD ``/`` ARE/BER well/QL operated/VBN and/CC follow/VB generally/RB\n",
    "    accepted/VBN practices/NNS which/WDT inure/VB to/IN the/AT best/JJT\n",
    "    interest/NN of/IN both/ABX governments/NNS ''/'' ./.\n",
    "'''"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('The', 'AT'),\n",
       " ('grand', 'JJ'),\n",
       " ('jury', 'NN'),\n",
       " ('commented', 'VBD'),\n",
       " ('on', 'IN'),\n",
       " ('a', 'AT'),\n",
       " ('number', 'NN'),\n",
       " ('of', 'IN'),\n",
       " ('other', 'AP'),\n",
       " ('topics', 'NNS'),\n",
       " (',', ','),\n",
       " ('AMONG', 'IN'),\n",
       " ('them', 'PPO'),\n",
       " ('the', 'AT'),\n",
       " ('Atlanta', 'NP'),\n",
       " ('and', 'CC'),\n",
       " ('Fulton', 'NP-TL'),\n",
       " ('County', 'NN-TL'),\n",
       " ('purchasing', 'VBG'),\n",
       " ('departments', 'NNS'),\n",
       " ('which', 'WDT'),\n",
       " ('it', 'PPS'),\n",
       " ('said', 'VBD'),\n",
       " ('``', '``'),\n",
       " ('ARE', 'BER'),\n",
       " ('well', 'QL'),\n",
       " ('operated', 'VBN'),\n",
       " ('and', 'CC'),\n",
       " ('follow', 'VB'),\n",
       " ('generally', 'RB'),\n",
       " ('accepted', 'VBN'),\n",
       " ('practices', 'NNS'),\n",
       " ('which', 'WDT'),\n",
       " ('inure', 'VB'),\n",
       " ('to', 'IN'),\n",
       " ('the', 'AT'),\n",
       " ('best', 'JJT'),\n",
       " ('interest', 'NN'),\n",
       " ('of', 'IN'),\n",
       " ('both', 'ABX'),\n",
       " ('governments', 'NNS'),\n",
       " (\"''\", \"''\"),\n",
       " ('.', '.')]"
      ]
     },
     "execution_count": 35,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "[nltk.tag.str2tuple(t) for t in sent.strip().split()]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('The', 'AT'), ('Fulton', 'NP-TL'), ...]"
      ]
     },
     "execution_count": 36,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "nltk.corpus.brown.tagged_words()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('now', 'RB'), ('im', 'PRP'), ('left', 'VBD'), ...]"
      ]
     },
     "execution_count": 37,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "nltk.corpus.nps_chat.tagged_words()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('Confidence', 'NN'), ('in', 'IN'), ('the', 'DT'), ...]"
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "nltk.corpus.conll2000.tagged_words()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('Pierre', 'NNP'), ('Vinken', 'NNP'), (',', ','), ...]"
      ]
     },
     "execution_count": 39,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "nltk.corpus.treebank.tagged_words()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "metadata": {},
   "outputs": [],
   "source": [
    "# The `simplify_tags` keyword is not accepted by this NLTK version: the call\n",
    "# raises TypeError (\"unexpected keyword argument 'simplify_tags'\"). Catch and\n",
    "# print the error so the demonstration does not abort Restart & Run All; the\n",
    "# next cell uses tagset='universal' instead.\n",
    "try:\n",
    "    nltk.corpus.brown.tagged_words(simplify_tags=True)\n",
    "except TypeError as err:\n",
    "    print(err)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('The', 'DET'), ('Fulton', 'NOUN'), ...]"
      ]
     },
     "execution_count": 42,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "nltk.corpus.brown.tagged_words(tagset='universal')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('一', 'Neu'), ('友情', 'Nad'), ('嘉珍', 'Nba'), ...]"
      ]
     },
     "execution_count": 44,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "nltk.corpus.sinica_treebank.tagged_words()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 45,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('মহিষের', 'NN'), ('সন্তান', 'NN'), (':', 'SYM'), ...]"
      ]
     },
     "execution_count": 45,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "nltk.corpus.indian.tagged_words()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "from nltk.corpus import brown\n",
    "\n",
    "brown_news_tagged = brown.tagged_words(categories='news', tagset='universal')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "tag_fd = nltk.FreqDist(tag for (word, tag) in brown_news_tagged)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('NOUN', 30654),\n",
       " ('VERB', 14399),\n",
       " ('ADP', 12355),\n",
       " ('.', 11928),\n",
       " ('DET', 11389),\n",
       " ('ADJ', 6706),\n",
       " ('ADV', 3349),\n",
       " ('CONJ', 2717),\n",
       " ('PRON', 2535),\n",
       " ('PRT', 2264),\n",
       " ('NUM', 2166),\n",
       " ('X', 92)]"
      ]
     },
     "execution_count": 52,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tag_fd.most_common()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAZsAAAEeCAYAAABc5biTAAAABHNCSVQICAgIfAhkiAAAAAlwSFlz\nAAALEgAACxIB0t1+/AAAIABJREFUeJzt3Xl8VdW5//HPl3mSWTEKAioOgFWbqDhWpVZqbUXrgK1X\n2lJtq7VeO/yU28HWll691nqr1unWVrRVoVoF5wGcqoImODAoBUQEBCmzEqYkz++PtSKHGEJI9j47\nOTzv1+u8ss/aw7N2IOc5a+2115aZ4ZxzzqWpRdYVcM45V/g82TjnnEudJxvnnHOp82TjnHMudZ5s\nnHPOpc6TjXPOudR5snHOOZc6TzbOOedS58nGOedc6lplXYGmomfPntavX78G779+/Xrat2+fXIWa\nSKxCj1fI55bveIV8bvmO15zOraysbLmZ7brdDc3MX2YUFxdbY5SWljZq/6Yaq9DjFfK55TteIZ9b\nvuM1p3MDSq0en7Hejeaccy51nmycc86lzpONc8651Hmycc45lzpPNs4551LnycY551zqUks2kv4s\naZmkGTll3SU9LWlO/NktZ91oSXMlzZZ0ck55saTpcd0NkhTL20oaF8unSuqXs8/IGGOOpJFpnaNz\nzrn6SfOmzjuBm4C7csquACaZ2dWSrojvL5c0EBgBDAL2AJ6RtJ+ZVQK3ABcAU4HHgGHA48AoYJWZ\n7StpBHANcI6k7sCVQAlgQJmkiWa2KsVzdc65xtm8Hj54HRa9Rt93XoYFXcEqwaqgKv7MfX1SVv3T\naimr3s5qKavezjho4wY4eCa0apva6aWWbMzshdzWRnQacHxcHgs8B1wey+8zs43AfElzgcMlvQd0\nNrMpAJLuAoYTks1pwC/jse4HboqtnpOBp81sZdznaUKCujfpc3TOuQYxg9ULYOFrsOhVWPQaLJ0O\nVRUA9ARYmL/qtIGQfFKU7+lqepnZkri8FOgVl/cEpuRstyiWbY7LNcur91kIYGYVktYAPXLLa9nH\nOefyb9O6T1otIcG8BuuWbb2NWkCvwdD7MBZs6krfffYPZS1aghSW1TKnrPq9ailrEcta1FKWsxzf\nvzVjJp9pmV6rBjKcG83MTJJlFR9A0oXAhQBFRUWUlZU1+Fjl5eWN2r+pxir0eIV8bvmOV8jntkPx\nzGhT/gGdVs2iY3x1WDsP1Wg5VLTuzMfdB7Ku60DWdR/Iuq4HUNWqwyexlld2SKjmVfG1beXWibLX\nX08oXu3ynWw+lFRkZkskFQHVqX0x0Cdnu96xbHFcrlmeu88iSa2ALsCKWH58jX2eq60yZnY7cDtA\nSUmJFRcXN/jEysrKaMz+TTVWoccr5HPLd7xCPrc64238GD6YtnWrpXz51tuoBex+EPQ+HPocDr0P\no1X3vekq0XVHYqUkH/HynWwmAiOBq+PPCTnl90j6PWGAwADgVTOrlLRW0hDCAIHzgRtrHOsV4Exg\ncmwtPQn8Nmek2xeA0emfmnOu4JnBinkhoVRfa/lw5qevd3ToGZNKSUgwexwKbTtlU+cmIrVkI+le\nQgujp6RFhBFiVwPjJY0CFgBnA5jZTEnjgVlABXBxHIkGcBFhZFt7wsCAx2P5HcDdcTDBSsJoNsxs\npaRfA6/F7a6qHizgnHM7ZFM5LC6DhVPYZ8Yz8My/YH2NjxO1hKKDQ1LpfRj0OQy69Q/XUtwn0hyN\ndu42Vg3dxvZjgDG1lJcCg2sp3wCctY1j/Rn4c70r65xzAB99CAunwPvxtfStT0aIfdLd1XHX2B12\nWGy1HAJtOmZW5ebCH57mnNs5VVXB8tlbEsvCKbDqva23qb7W0mcI71bsxt7HnQ1d+3qrpQE82Tjn\ndg6b18PiafD+K7BwKix8FTas3nqb1h1Di6XPENjrCNizBNp1BmBVWRl065f/ehcITzbOucL08b+3\n7hJb8iZUbd56m132gL2GhFefI8J9Li
39YzEN/lt1zjV/VVWwYk5otbw/NSSZle/W2Eghmew1ZEvL\npUsf7xLLE082zrnmZ/MGOq6YDi8+H7vEpsL6GtMftu4AexbDXkeGxNL7MGjXJZv6Ok82zrlmoLIi\nTPcy//nwen8qB1Ru3HqbTrtv3SW2+0HQsnU29XWf4snGOdf0VFXBspkw/4Xweu8l2PTRVpus36U/\n7fc/YUuXmI8Sa9I82TjnsmcWrrG8+1xMLi9C+Yqtt+m+D/Q/Dvb+HPQ7llnvLMjrlC6ucTzZOOey\nsWZxbLk8H36uXbz1+l32CIml/3Hh1aV3jQMsyFtVXeN5snHO5ce65aHFMv8FePd5WDlv6/Xtu29J\nLP0/Bz328W6xAuLJxjmXjg1rYcHLW667fDh96/VtOkHfo7e0XnYbFJ6/4gqSJxvnXCJUuSm0WKq7\nxhZPC48drtaybbiQ3/846H98mFPMR4vtNDzZOOcaxgyWzYK5k2DeJA5576Wt79BXyzBRZXXXWJ8j\noHW77OrrMuXJxjlXf+Ur4d1nYe5kmDcJPlryyaoWAL0O2tIttteRn8wr5pwnG+fctlVWwOLST1ov\nLJ4G5DzNvVMv2OdE2Gcob37cnYOPqvUJIs55snHO1bB6YUgsc5+Bd1+AjWu2rGvZJtyhv89Q2Hdo\nmGssjhirKCvLqMKuOfBk49zOblM5LHhpS+tl+b+2Xt99n5BY9v089DvGHxTmGsSTjXM7mxoX9lnw\nCuTOM9Zml3DdZZ8TQ5LxZ7i4BHiycW5nUMeFfRDsceiWrrHeh/mQZJe4TJKNpEuBCwAB/2dm/yup\nOzAO6Ae8B5xtZqvi9qOBUUAl8AMzezKWFwN3Au2Bx4BLzcwktQXuAoqBFcA5ZvZevs7PucxVVcHi\nUoreuQum/WQbF/Zjctn7eOjYM6OKup1F3pONpMGERHM4sAl4QtIjwIXAJDO7WtIVwBXA5ZIGAiOA\nQcAewDOS9jOzSuCWeKyphGQzDHickJhWmdm+kkYA1wDn5PM8ncs7s5BUZv4DZvwDPvqAParX1XFh\n37l8yKJlcyAw1czKASQ9D5wBnAYcH7cZCzwHXB7L7zOzjcB8SXOBwyW9B3Q2synxOHcBwwnJ5jTg\nl/FY9wM3SZKZ5Xy1c64AmMGHM2DGAyHBrM6ZnLJLH5Z1L2G3I8/1C/suc1kkmxnAGEk9gPXAKUAp\n0MvMqjuSlwK94vKewJSc/RfFss1xuWZ59T4LAcysQtIaoAewPPGzcS4L//5XbME8sPXosU67w6DT\nYfBXoXcJC6dNY7f9fBp+l728Jxsze1vSNcBTwDrgDcK1mNxtTFLqrRBJFxK67ygqKqKsEfcJlJeX\nN2r/phqr0OM1p3NrU76EboufpfsHz9Jh7ZYZkze36cLqouNYuceJfNxjcJgmZhmwbJr/LptpvEI8\nt0wGCJjZHcAdAJJ+S2iVfCipyMyWSCoi/LkALAb65OzeO5Ytjss1y3P3WSSpFdCFMFCgZj1uB24H\nKCkpscY8iKmsrCxvD3LKZ6xCj9fkz23NYpj5YGjFLM75MGjbBQ78Mgw+g9b9P8euLVuxaxLxGqHJ\n/y6bUbxCPLesRqPtZmbLJO1FuF4zBOgPjASujj8nxM0nAvdI+j1hgMAA4FUzq5S0VtIQwgCB84Eb\nc/YZCbwCnAlM9us1rtn4eBnMmhCuwbz/8pby1h3hgFNCF9k+J0KrttnV0bkdlNV9Ng/EazabgYvN\nbLWkq4HxkkYRHsF3NoCZzZQ0HpgFVMTtq7vdLmLL0OfH4wtCq+nuOJhgJWE0m3NNV/lKePvhcA3m\nvRfBqkJ5q3Yw4AshwQz4ArTpkG09nWugrLrRjq2lbAVQ6yx+ZjYGGFNLeSkwuJbyDcBZja+pcyna\nsBZmPxYSzLzJUFURylu0hgEnw+AzYP8vQttdsq2ncwnwGQScy6MWFetD99iMB2DO01umiVHL0DU2\n6A
w48FRo3y3bijqXME82zuXD+tXwzJV85o37oHJDLBT0PQYGnw4HngadarvE71xh8GTjXNrmTYYJ\n34e1i2kJYe6xQWfAoOHQeY/t7e1cQfBk41xaNq2Dp6+E1/4vvN+zmJkDLmbQ8V/Ntl7OZcCTjXNp\nWPgaPPgdWDkPWrSC46+Aoy9jwxtvZl0z5zLhyca5JFVsguf+G1763zB8ebeBcPqtUHRw1jVzLlOe\nbJxLytIZ8OB34cPpgODoS+GEn/rNl87hyca5xquqhJdvgMljoGpzeLLl8Fuh75FZ18y5JsOTjXON\nsWIePPQ9WDg1vC/5Fpz0a2jbKdt6OdfEeLJxriHMoPQOeOrnsLkcdimCr9wEAz6fdc2ca5I82Ti3\no9Z+EO6bmTcpvB98JpxyLXTonm29nGvCPNk4V19mMP3v8NiPYcOaMKXMl34f5jBzztXJk41z9bFu\nBTx6WZj6H8JEmV+5AXbZPdt6OddMeLJxbntmPwETL4F1y6BNJzj5t/DZ80HKumbONRuebJzblg1r\n4cnR8Ppfw/u+R8Pwm8PQZufcDvFk41xt5r8ID10Ea96Hlm1h6C9gyEXQokXWNXOuWfJk41yuzeth\n0lUw5ebwvuhgOP122O2AbOvlXDPnyca5aounhckzl/8rPMzsuB/DcT+Blq2zrplzzd52k42kjsB6\nM6uStB9wAPC4mW1OvXbO5UPlZnjhd/DCtWCV0HO/MHnmnsVZ18y5glGfls0LwLGSugFPAa8B5wBf\nT7NizuVDu4/egz/9EJa8EQqGXBSuz7Run2m9nCs09bnaKTMrB84Abjazs4BBjQkq6TJJMyXNkHSv\npHaSukt6WtKc+LNbzvajJc2VNFvSyTnlxZKmx3U3SGEsqqS2ksbF8qmS+jWmvq5AvTWeA1/4Tkg0\nXfrAyIdh2H97onEuBfVKNpKOJLRkHo1lLRsaUNKewA+AEjMbHI81ArgCmGRmA4BJ8T2SBsb1g4Bh\nwM2SquPfAlwADIivYbF8FLDKzPYFrgeuaWh9XYF69zl46Hu0qNoMh5wH33sZ+h+Xda2cK1j1STaX\nAqOBB81spqS9gWcbGbcV0F5SK6AD8AFwGjA2rh8LDI/LpwH3mdlGM5sPzAUOl1QEdDazKWZmwF01\n9qk+1v3A0OpWj3MsewfGnQ9VFSzd52wY/kdo1znrWjlX0OpzzaaXmX2l+o2ZvSvpxYYGNLPFkn4H\nvA+sB54ys6ck9TKzJXGzpUCvuLwnMCXnEIti2ea4XLO8ep+FMV6FpDVAD2B5bl0kXQhcCFBUVERZ\nWVlDT4vy8vJG7d9UYxVavFYbV3LAi9+n7cY1rNr9WOb0PY/FBXJuWccr5HPLd7yCPDczq/MFTKtP\nWX1fQDdgMrAr0Bp4CDgPWF1ju1Xx503AeTnldwBnAiXAMznlxwKPxOUZQO+cdfOAnnXVq7i42Bqj\ntLS0Ufs31VgFFW/jOrPbTzC7srPZbcebbVxXOOfWBOIV8rnlO15zOjeg1Orx2b/Nlo2kLwKnAHtK\nuiFnVWegohH57fPAfDP7d4zzD+Ao4ENJRWa2JHaRLYvbLwb65OzfO5Ytjss1y3P3WRS76roAKxpR\nZ9fcVVWFe2gWl0GXveDc+6BNh6xr5dxOo65rNh8ApcAGoCznNRE4uY79tud9YIikDvE6ylDg7Xjc\nkXGbkUCcXpeJwIg4wqw/YSDAqxa63NZKGhKPc36NfaqPdSYwOWZgt7Oa9Et4eyK07QxfHw+79Nru\nLs655GyzZWNmbwJvSrrHEryB08ymSrofmEZoIb0O3A50AsZLGgUsAM6O28+UNB6YFbe/2Mwq4+Eu\nAu4E2gOPxxeErra7Jc0FVhJGs7mdVelf4KU/QItWcPZdsNuBWdfIuZ1OfQYIHC7pl0DfuL0AM7O9\nGxrUzK4ErqxRvJHQyqlt+zHAmFrKS4HBtZRvAM5qaP1cAZk7CR79
UVj+0u9hnxOyrY9zO6n6JJs7\ngMsIXWiV29nWuabjw1nw92+EKWiOuQyKR253F+dcOuqTbNaY2ePb38y5JuSjD+Ges2HjWhg4HE78\nRdY1cm6nVp9k86yka4F/ELq6ADCzaanVyrnG2FQO954DaxZC78PCpJr+HBrnMlWfZHNE/FmSU2bA\niclXx7lGqqqEf1wAH7wOXfvCiHt9rjPnmoDtJhsz8yuqrvl4+hfwziPQrgt8/e/Qadesa+Sco37P\ns6m1s9vMrkq+Os41wmt/glduCkOcz/kr7Lp/1jVyzkX16UZbl7PcDjiVcBOmc03HnKfhsZ+E5S/f\n4DM4O9fE1Kcb7brc93ESzSdTq5FzO2rp9DjEuSo8xvlQf66fc01NQ4bodGDrOcmcy87aJXDPObDp\nYxh8Jpzw06xr5JyrRX2u2UwnjD6D8KCzXQG/XuOyt/HjcC/N2sXQZwic9kfwxxY51yTV55rNqTnL\nFcCHZtaYWZ+da7yqSnjg27D0LejWH0bcA63bZV0r59w2bLcbzcwWAF2BLwOnAwPTrpRz2/XkT+Ff\nj0O7rvD1+6Fjj6xr5Jyrw3aTjaRLgb8Bu8XX3yRdknbFnNumqbfB1FugRevQoum5b9Y1cs5tR326\n0UYBR5jZOgBJ1wCvADemWTHnavWvJ+GJK8LyaX+EfkdnWx/nXL3UZzSa2Hq258pY5lx+LXkL/v7N\nMMT5+NFw8DlZ18g5V0/1adn8BZgq6cH4fjjhsQPO5c+axWHk2eZ18Jlz4HOXZ10j59wOqM9Nnb+X\n9BxwTCz6ppm9nmqtnMu18aMwi/NHS2Cvo+ArN/oQZ+eamW0mG0mHAT3N7PH4OIFpsfwUSS3MrCxf\nlXQ7scoKuP9bYZaA7vvAiL9Bq7ZZ18o5t4PqumZzDTCrlvKZwLXpVMe5HGZhMMCcp6B99zCLc4fu\nWdfKOdcAdSWbXeI9NluJZT0bGlDS/pLeyHmtlfSfkrpLelrSnPizW84+oyXNlTRb0sk55cWSpsd1\nN0ihb0VSW0njYvlUSf0aWl+Xoam3wmv/By3bhCHOPfbJukbOuQaqK9l0q2Ndh4YGNLPZZnaImR0C\nFAPlwIPAFcAkMxsATIrvkTQQGAEMAoYBN0tqGQ93C3ABMCC+hsXyUcAqM9sXuJ7QSnPNyTuPwhOj\nw/LwW6DvkdnWxznXKHUlm2ckjaluLQAouAqYnFD8ocC82Fo6DRgby8cSRr0Ry+8zs41mNh+YCxwu\nqQjobGZTzMyAu2rsU32s+4GhuefhmrYOq/8VpqLB4ISfwUFnZl0l51wj1TUa7UfAn4C5kt6IZQcD\npcC3E4o/Arg3LvcysyVxeSnQKy7vCUzJ2WdRLNscl2uWV++zEMDMKiStAXoAyxOqt0vL6oXs++p/\nweZyOPhrcNyPs66Rcy4B20w2ccaAcyXtTejCAphpZu8mEVhSG+ArwOhaYpsk+/ReyZJ0IXAhQFFR\nEWVlDR9gV15e3qj9m2qsfMZrUVHO/v/8AR02ruSjHocwp/dIbNq0VGMW6u8yi3iFfG75jleQ52Zm\nmbwIXV1P5byfDRTF5SJgdlweDYzO2e5J4Mi4zTs55ecCt+VuE5dbEVo0qqs+xcXF1hilpaWN2r+p\nxspbvMpKs7+dY3ZlZ1v/P4PMylemH9MK9HeZUbxCPrd8x2tO5waUWj0+8xvy8LSknMuWLjSAicDI\nuDwSmJBTPiKOMOtPGAjwqoUut7WShsTrMefX2Kf6WGcCk+MvxTVVz/7mk1mc5x7xW2hf1/gU51xz\nU5/pahInqSNwEvCdnOKrgfGSRgELgLMBzGympPGEe34qgIvNrHqutouAO4H2wOPxBWE6nbslzQVW\nEq4NuaZq+v3w4nWglnD2WDau2iXrGjnnElavZCPpGGCAmf1F0q5AJwsjwxrEwvWgHjXKVhBGp9W2\n/RhgTC3lpcDgWso3AGc1tH4u
jz54HSZcHJaH/TfsfTzksa/aOZcf9XmezZXA5Wy5kN8a+GualXI7\niY8+hHu/BhUb4LPnw+EXZl0j51xK6nPN5nTCqLF1AGb2AeD9HK5xKjbCuK/DRx/AXkfCKdf55JrO\nFbD6JJtN8eK6wSfXW5xrODN45DJY9Bp07g1n3w2t2mRdK+dciuqTbMZLug3oKukC4Bng/9Ktlito\nU26GN/4GrTvAufdCp12zrpFzLmX1eZ7N7ySdBKwF9gd+YWZPp14zV5jmPgNP/SwsD78Zij6TbX2c\nc3mx3WQj6YfAOE8wrtGWz4W/fys81vlzl8Og07OukXMuT+rTjbYL8JSkFyV9X1Kv7e7hXE3rV8O9\nI2DjGjjgVPjcFVnXyDmXR9tNNmb2KzMbBFxMmCLmeUnPpF4zVziqKuGBUbBiDuw2CE6/DVpkOXmF\ncy7fduQvfhlhNuYVwG7pVMcVpGeuDNdqOvQIAwLadsq6Rs65PKvPTZ0XSXqO8ECzHsAFZuZXdV39\nvHEvvHwjtGgFZ98F3fpmXSPnXAbqM11NH+A/zeyN7W7pXK6Fr8HDPwjLp1wL/Y7Jtj7OucxsM9lI\n6mxma4Fr4/vuuevNbGXKdXPN2ZrFYYaAyk1w2Leh5FtZ18g5l6G6Wjb3AKcCZYTZA3LnEjFg7xTr\n5Zqzzevhvq/Bxx9Cv2Nh2NVZ18g5l7G6ntR5avzZP3/Vcc2eGUz4Pix5A7r2hbPGQsvWWdfKOZex\n+gwQmFSfMucA+Of1MON+aNMJzr0POvbY/j7OuYJX1zWbdkAHoKekbmzpRusM7JmHurnmZvbjMOmq\nsHzG7dBrYLb1cc41GXVds/kO8J/AHoTrNtXJZi1wU8r1cs3NsrfhgW8DBif+DA74UtY1cs41IXVd\ns/kD8AdJl5jZjXmsk2tuyleGqWg2fQyDzoBjf5x1jZxzTUx9Zn2+UdJgYCDQLqf8rjQr5pqJys3w\n95Gw6j3Y/TNw2h/9IWjOuU+p72Ohb4yvE4D/ITy5s8EkdZV0v6R3JL0t6UhJ3SU9LWlO/NktZ/vR\nkuZKmi3p5JzyYknT47obpPApJ6mtpHGxfKqkfo2pr6vDkz+F+S9Ax13DVDRtOmRdI+dcE1SfudHO\nBIYCS83sm8DBQJdGxv0D8ISZHRCP9zZwBTDJzAYQpsa5AkDSQGAEMAgYBtwsqWU8zi3ABcCA+BoW\ny0cBq8xsX+B64JpG1tfVpuxOePU2aNEazvkbdOmddY2cc01UfZLNejOrAiokdSZMyNmnoQEldQGO\nA+4AMLNNZrYaOA0YGzcbCwyPy6cB95nZRjObD8wFDpdUBHQ2synxsdV31din+lj3A0OrWz0uIQte\nhkfjtZlTr4e9jsi2Ps65Jq0+yaZUUlfCo6DLgGnAK42I2R/4N/AXSa9L+pOkjkAvM1sSt1kKVD83\nZ09gYc7+i2LZnnG5ZvlW+5hZBbCGMImoS8Lq92Hcf0DVZhhyEXz2P7KukXOuiVNoFNRz43Dto7OZ\nvdXggFIJMAU42symSvoDYTj1JWbWNWe7VWbWTdJNwBQz+2ssvwN4HHgPuNrMPh/LjwUuN7NTJc0A\nhpnZorhuHnCEmS2vUZcLgQsBioqKih9++OGGnhbl5eV06JCf6xX5jFUzXouK9ez/0g/osHYea3sW\nM+eIq6FFy+0coeHx0pbl77LQ4hXyueU7XnM6t5KSkjIzK9nuhmZW6wv4bF2vbe23vRewO/Bezvtj\ngUeB2UBRLCsCZsfl0cDonO2fBI6M27yTU34ucFvuNnG5FbCcmFi39SouLrbGKC0tbdT+TTXWVvEq\nK83uO8/sys5mfzjErHxluvHyILPfZQHGK+Rzy3e85nRuQKnV47O/rqHP19WVo4ATt5vJatvRbKmk\nhZL2N7PZhMEHs+JrJHB1/Dkh7jIRuEfS7wk3mA4AXjWzSklrJQ0BpgLnE0bMVe8zktDddyYwOf
5S\nXGO8cC28PRHadg5T0bTvtv19nHOOum/qPCHFuJcAf5PUBngX+Cbh+tF4SaOABcDZsR4zJY0nJKMK\n4GIzq4zHuQi4E2hP6Fp7PJbfAdwtaS6wkjCazTXGrInw3G8BwVfvgF33z7pGzrlmZLs3dUo6v7Zy\na8RNnRYexFZbH9/QbWw/BhhTS3kpMLiW8g3AWQ2tn9ta+zXz4IlLw5uTfgX7fSHbCjnnmp36PKnz\nsJzldoSEMI0w1NgVunXL2ee1n8HmcvjMOXDUD7KukXOuGarPdDWX5L6Pw6DvS61Grumo3Azjz6ft\n+g9hz2L48g0+FY1zrkHqc59NTesI98q4QvfUz2DBS2xq2yPMENC63fb3cc65WtTnms3DhNFnEJLT\nQGB8mpVyTcCb42DqrdCiNe+W/JIDOhdlXSPnXDNWn2s2v8tZrgAWWLxZ0hWoJW/Bw3FAwBevYV2L\nQdnWxznX7NXnms3zAHFetFZxubuZrUy5bi4L5Sth3NehYj0cch6UfAumTcu6Vs65Zq4+3WgXAlcB\nG4AqwhM7Ddg73aq5vKuqhAdGhbnP9jgUvnSdDwhwziWiPt1oPwEGW415xVwBmvwbmDcZOvSAs+/2\nAQHOucTUZzTaPKA87Yq4jM2aCP/8PagFnPkX6Nrgp0g459yn1KdlMxp4WdJUYGN1oZn53X2FYtk7\n8ND3wvJJV8Hen8u2Ps65glOfZHMbMBmYTrhm4wrJhjVhQMCmj2HwV+HI72ddI+dcAapPsmltZj9M\nvSYu/6qq4MHvwYq5sNtA+MqNPiDAOZeK+lyzeVzShZKKJHWvfqVeM5e+F6+D2Y9Cuy5wzl+hTces\na+ScK1D1admcG3+Ozinzoc/N3Zyn4dkxgOCMP0GPfbKukXOugNXnpk6fB63QrHw33E+DwQk/9UcG\nOOdSl8nzbFyGNq2D+84LAwP2PwWO/XHWNXLO7QT8eTY7EzOYeAksmwk99oXTb4UWDZn42znndow/\nz2ZnMuVmmPEAtOkUHhnQrkvWNXLO7ST8eTY7i/kvwFM/D8vDb4bdDsi2Ps65nYo/z2ZnsGYR/P2b\nYJVwzGUw8LSsa+Sc28lk8jwbSe8BHwGVQIWZlcR7d8YB/YD3gLPNbFXcfjQwKm7/AzN7MpYXA3cC\n7YHHgEvNzCS1JVxTKgZWAOeY2XuNqXOztXkDjPsPKF8Oe58AJ/486xo553ZC2+xGk7SvpKPN7Pmc\n10tAX0lJ3JRxgpkdYmYl8f0VwCQzGwBMiu+RNBAYAQwChgE3S2oZ97kFuAAYEF/DYvkoYJWZ7Qtc\nD1yTQH18p8JaAAAZCklEQVSbHzN47MfwwTTouhec+Wdo0XL7+znnXMLqumbzv8DaWsrXxnVJOw0Y\nG5fHAsNzyu8zs41mNh+YCxwuqQjobGZTzMwILZnhtRzrfmCotBPOw1L2F3j9bmjVLswQ0MEnfnDO\nZUPhc7qWFdJrZnbYNtZNN7ODGhxUmg+sIXSL3WZmt0tabWZd43oRWiZdJd0ETDGzv8Z1dwCPE7ra\nrjazz8fyY4HLzexUSTOAYdXdfZLmAUfUfCZPfDDchQBFRUXFDz/8cENPifLycjp06NDg/ZOO1XHl\nTPZ7+TJaWAXzDx3Nyt4npRovSU3td+nxml6sQo/XnM6tpKSkLKeHatvMrNYXMKeOdXO3ta4+L2DP\n+HM34E3gOGB1jW1WxZ83AefllN8BnAmUAM/klB8LPBKXZwC9c9bNA3rWVafi4mJrjNLS0kbtn2is\ntUvNfre/2ZWdzR79SfrxEtakfpcer0nGKvR4zencgFKrx+d+Xd1opZIuqFko6dtA2XazWB3MbHH8\nuQx4EDgc+DB2jRF/LoubLwZyn+TVO5Ytjss1y7faR1IroAthoEDhq9wMf/8GfLQE9joKTh6TdY2c\nc67OZPOfwDclPSfpuvh6nnDx/dKGBpTUUdIu1cvAFwgtkY
nAyLjZSGBCXJ4IjJDUVlJ/wkCAV81s\nCbBW0pDY7XZ+jX2qj3UmMDlm4ML35E/h/ZdhlyI4605o2TrrGjnn3LaHPpvZh8BRkk4ABsfiR81s\nciNj9gIejNfrWwH3mNkTkl4DxksaBSwAzo71mClpPDCLMPT6YjOrjMe6iC1Dnx+PLwhdbXdLmgus\nJIxmK3xv3gev3gYtWsPZd8EuvbKukXPOAfWbruZZ4NmkAprZu8DBtZSvIMy7Vts+Y4BP9QeZWSlb\nEmFu+QbgrEZXtjlZ8iY8HBucp/wP9Dk82/o451wOn4WxEJSvhHHnQcUGOPQ/oPibWdfIOee24smm\nuauqhPu/Bavfhz0+C6f8zh/t7JxrcjzZNHeTfw3vPgsdesI5d0PrdlnXyDnnPsWTTXM2awL883pQ\nyzDyrEvv7e7inHNZ8GTTXC17Bx66KCx/4dfQ/9hs6+Occ3XwZNMMtdj8MYz7Omz6GAafCUMuyrpK\nzjlXJ082zU1VFf1fvxpWzIVeg+ErN/iAAOdck+fJprl56Xq6fvhyeKTzOXdDm45Z18g557bLk01z\nsuQtePa3Yfmrd0D3vbOtj3PO1ZMnm+aiYiM8+F2oqmBZv+EwoOGPDHDOuXzzZNNcPHc1LJsJ3fdm\n8YGfmozbOeeaNE82zcHC1+Cl/wW1gOG3UtWqfdY1cs65HeLJpqnbVA4PfResCo66BPY6IusaOefc\nDvNk09RNuioMc971QDj+v7KujXPONYgnm6Zs/gsw9RZo0QpOv8XnPXPONVuebJqqjR/BQxeH5eN+\nAnscmm19nHOuETzZNFVP/hTWvA9FB8OxP8q6Ns451yiebJqiOU/DtLHQsg2cfhu0bJ11jZxzrlE8\n2TQ15SthwvfD8ok/g90OzLY+zjmXgMySjaSWkl6X9Eh8313S05LmxJ/dcrYdLWmupNmSTs4pL5Y0\nPa67QQozUkpqK2lcLJ8qqV++z6/BHr8cPl4KfY6AI7+fdW2ccy4RWbZsLgXeznl/BTDJzAYAk+J7\nJA0ERgCDgGHAzZJaxn1uAS4ABsTXsFg+ClhlZvsC1wPXpHsqCZk1AaaPh1btYfgt0KLl9vdxzrlm\nIJNkI6k38CXgTznFpwFj4/JYYHhO+X1mttHM5gNzgcMlFQGdzWyKmRlwV419qo91PzC0utXTZH38\nb3jksrB80lXQY59s6+OccwlS+JzOc1DpfuC/gV2AH5vZqZJWm1nXuF6ElklXSTcBU8zsr3HdHcDj\nwHvA1Wb2+Vh+LHB5PNYMYJiZLYrr5gFHmNnyGvW4ELgQoKioqPjhhx9u8DmVl5fToUOHhu1sxt6l\nv6Db0pdY2/NQ5gy5NkxNk0asBijkeIV8bvmOV8jnlu94zencSkpKysysZHvbtWrQ0RtB0qnAMjMr\nk3R8bduYmUlKPQua2e3A7QAlJSVWXFzc4GOVlZXR4P3fHAdLX4I2u9D5vLso7rpXerEaoJDjFfK5\n5TteIZ9bvuMV4rnlPdkARwNfkXQK0A7oLOmvwIeSisxsSewiWxa3Xwz0ydm/dyxbHJdrlufus0hS\nK6ALsCKtE2qUNYvhsZ+E5WH/DdtJNM451xzl/ZqNmY02s95m1o9w4X+ymZ0HTARGxs1GAhPi8kRg\nRBxh1p8wEOBVM1sCrJU0JHa7nV9jn+pjnRlj5L+/cHvMYOIlsHENDDgZDj0v6xo551wqsmjZbMvV\nwHhJo4AFwNkAZjZT0nhgFlABXGxmlXGfi4A7gfaE6ziPx/I7gLslzQVWEpJa0zNtLMybBO26wldu\ngCY+hsE55xoq02RjZs8Bz8XlFcDQbWw3BhhTS3kpMLiW8g3AWQlWNXmr3gtT0gB86TrYZfdMq+Oc\nc2nyGQSyUFUVJtnc9DEMHA6Dv5p1jZxzLlWebLLw6m2w4J/QcVf40u+9+8w5V/A82eTb8jnwzC/D\n8pdvgI49Mq2Oc87lgy
ebfKqsgAe/CxUb4OCvwQGnZF0j55zLC082+fTyH2BxKXTeM9xT45xzOwlP\nNvmydAY8GxPMV26E9l2zrY9zzuWRJ5t8qNgUus+qNkPJKNi31hHezjlXsDzZ5MML/wMfTodu/cKM\nzs45t5PxZJO2RWXw4u8BhWfUtO2UdY2ccy7vPNmkafN6eOi7YJVw5MXQ96isa+Scc5nwZJOmyb+B\n5f+CnvvDiT/PujbOOZcZTzZpee8leOWPoJZw+i3Qul3WNXLOucx4sknDxo/hoe8BBsf+CPbM30OQ\nnHOuKfJkk4anfw6rF8DuB8FxP8m6Ns45lzlPNkmb+wyU/hlatIbTb4NWbbKukXPOZc6TTZLWr4YJ\nl4TlE0ZDr0HZ1sc555oITzZJeuIK+OgD2LMEjro069o451yT4ckmIV2W/BPevBdatYPTb4WWTemJ\n2845ly1PNklYt5y+b10flj//S+g5IMvaOOdck5P3ZCOpnaRXJb0paaakX8Xy7pKeljQn/uyWs89o\nSXMlzZZ0ck55saTpcd0NUnjkpaS2ksbF8qmS+qV2QmbwyGW03rQK+h4Dh38ntVDOOddcZdGy2Qic\naGYHA4cAwyQNAa4AJpnZAGBSfI+kgcAIYBAwDLhZUst4rFuAC4AB8TUslo8CVpnZvsD1wDWpnc2M\nB+DtiVS2bA/D/wgtvLHonHM15f2T0YKP49vW8WXAacDYWD4WGB6XTwPuM7ONZjYfmAscLqkI6Gxm\nU8zMgLtq7FN9rPuBodWtnsR17Qs99mXRoO+FWZ2dc859SiZfwyW1lPQGsAx42symAr3MbEncZCnQ\nKy7vCSzM2X1RLNszLtcs32ofM6sA1gA9UjgV6HMYfPefLN/rS6kc3jnnCkEmQ6bMrBI4RFJX4EFJ\ng2usN0mWdj0kXQhcCFBUVERZWVmDj1W+fn2j9t+hWOXleYtV6PEK+dzyHa+Qzy3f8Qry3Mws0xfw\nC+DHwGygKJYVAbPj8mhgdM72TwJHxm3eySk/F7gtd5u43ApYDqiuehQXF1tjlJaWNmr/phqr0OMV\n8rnlO14hn1u+4zWncwNKrR6f9VmMRts1tmiQ1B44CXgHmAiMjJuNBCbE5YnAiDjCrD9hIMCrFrrc\n1koaEq/HnF9jn+pjnQlMjr8U55xzGciiG60IGBtHlLUAxpvZI5JeAcZLGgUsAM4GMLOZksYDs4AK\n4GIL3XAAFwF3Au2Bx+ML4A7gbklzgZWE0WzOOecykvdkY2ZvAYfWUr4CGLqNfcYAY2opLwUG11K+\nATir0ZV1zjmXCL8pxDnnXOo82TjnnEudJxvnnHOpkw/SCiT9mzAwoaF6EoZY50M+YxV6vEI+t3zH\nK+Rzy3e85nRufc1s1+1t5MkmIZJKzayk0GIVerxCPrd8xyvkc8t3vEI8N+9Gc845lzpPNs4551Ln\nySY5txdorEKPV8jnlu94hXxu+Y5XcOfm12ycc86lzls2zjnnUufJxjnnXOo82bidhqRMnt/kXFMh\naa861h2bamy/ZrPj6voHAzCz91OM3RNYkdYjEyTtCvQF5prZ6jRi7EBddjezpQkeb5qZfTap4zUl\nkg4zs9fyGK97Has3mtm6hOPl9W9O0lNm9oUkj9kUSHoXuBW4rnr2fEm9gOuAA9K818a/6TXMo4AB\nyikzYFdgN6BlEkEkDQGuJjwm4dfA3YQ7fVtIOt/MnkgiTk68bwO/BeYB/SVdaGYTk4yxg+4Aknze\ntra/SUKBpBsJ/ydqs5HwO/6bmX2UUMjbJXUC7gPuNbNZCR13W8r49N9AtVbhEVNcYWZ/SyheXv7m\ncmz3jvikSLqhrvVm9oMEwxUTPlPekHQpcBDwQ+B/CM8ES423bBIgqR9wOfB54AYzuzGh45YC/wV0\nIQxN/KKZTZF0AOED5VOPamhkvBnACWb2b0l7Ez4Mj0wyRpYkLQJ+v631ZrbNdQ2INbKO
1a2AQcBB\nZnZSgjH3Jzy76RxgM3AvcJ+ZvZdUjB2oy67A82Y2MKXj9yOFv7mc479LeIJwrczsHwnG2gTMAMYD\nH1AjgZvZ2KRi5cS8FLg+xhtiZouSjlGTt2waQdIA4KfAEYRm6A/MbHOCIVqZ2VMx1lVmNgXAzN6J\n3xyTtsnM/h1jvCupbRpBMtQS6EQeWjj1+YCQ9FjCMWcDvwJ+JelgQuKZJGmpmR2dZKztdGuZmS2U\ndHmSMWPctP/mqnUBTqX2/ysGJJZsCA+UPIvwJaECGAfcn0Y3dnxK8jWE398w4BTgcUmXmtnkpOPl\n8mTTAJIGE/7DDyI0P0flPD00SVU5y+trrEujSdq7RpN+q/cJN+ezsMTMrspXsNi6uRTYPxa9TfgW\nfheAmZ2SUtwWhK6lXkBHYFkKYbbbrWVmDycVLI9/c9UWmNm3Ujz+J+KDI28FbpXUm/AlYZaky83s\n7oTDTQNuJjzxuAJ4StIhwM2SFpjZuQnH+4Qnm4Z5E1hI+IM7HDg8t6WR4IfywZLWEv6g28dl4vt2\nCcXI9ZMa78tSiJGlfF6zGQn8J6E/fFqM/VngWkmWwodI9Wiic4HhwHTC9ZvLzGxN0rHM7KAasfux\npVvrt0nHI39/c9Xy9n/lk4DSZwn/ficRHnGfxt/fcTW7zMzsDeAoSRekEO8Tfs2mASR9gzpaFmn0\nsbrGk3S2mY2Py/3NbH7OujMS7oefAoyoeb0kfijfZ2ZDkooVj7uQ8IiM+4DxZpZGa6a2uDW7tcam\n0a21nWtgif/NSRpsZjNqKW8BnJvgwAckXUUYCPM24d/vidjqKCiebJqh2O96sZmNSeHYdXb9NGe5\nQ59rDoNOeli0pFnbujhe17pGxOtrZo15HtOOxqvZrXVvyt1aubE7AZjZxynG6AxcDOwJTASeBr4P\n/Ah408xOSzBWFTAfKI9F1R/KIlz/+kxSsbLk3WgNIOlhtm7ZGOHBQ8+a2V8TjNMH+DmwB/AQYXTR\nVYQhivckFScnXt67fvJM21iu7X1j1bzGVt91DWJmC/L8RSHf3VpI+h4wmnAdCkkfA9eY2c1JxyLc\nZrAKeAX4NmFUqIDhsdspSf0TPl6T5MmmYX5XS1l34LzY/L4ioTh3Ac8DDxBGjpQCbxCGzCZ2s2OO\n7wGn1+j6mSzpq4TmfXNPNjW/IGxrXRIOlPRWLeUC9k44VhZfFPJy8byapJ8BRwHHm9m7sWxv4A+S\nupvZbxIOuXf1dSlJfwKWAHuZ2YaE45DPFmmWvBstQZJaAmVmdkhCx3vTzA7Oeb+I8B++qo7dGhMv\nr10/+SZpNfAC4YP42LhMfH+MmXVLMFbf2oqBPsDopEei5fsaUY0Y+ejWmg0cXPPDXlJ7QrfWfgnH\nS7WbtUasj9hGTwlweRyt1ux5yyZBZlaZ9P0vkrqxpYtnBdBFMYiZrUw0WJ67fjKQ289es3VaW2u1\nwXK/rUo6FPga4V6K+YSWatI613bzppm9F68/JC7P3VpWW6vCzNbHax5Jyx0JCltGg1ZfR0nsd2pm\nu9Qsi3/33yAMiT4rqVhZ8mTTAKp9XqhuhGspMxMM1YUw/DE3g02LP43ku2Py2vWTb2b2fPVyvMOd\n6ptYkyZpP8Iw1nMJ31LHEXoSTkgjHnn+opBBt9ZiSUPNbFKNepxI6OJKlJklPf3NjsZfBVwv6T+y\nrEeSvButASTNZ+sb2ozQ6ngW+I2Zrd3Wvk1Zvrt+8i22CH8BXEKY8VyEO7ZvTPpmz/ht+0XCzYdz\nY9m7ZpZK0pZUDsytbRXh+kPHhOPlu1trEDAB+Cdb7j8pAY4GTjOzJL/kIakd8F1gX+At4M/5Ho4s\nqTWhW95Ho+2szCwvo0cknVc9uk3S0Wb2Us6675vZTUnGy6DrJ98uA44BDqu+xyZ+G79F0mVmdn2C\nsc4g3An+rKQnCAMs0rxR8MBayj75opBCvLx2a5nZ
zDjc+muE4dYQrrl9J42L9sBYwvxyLxKmdBlE\nGOmXOEln1FLcjTB9zf1pxMyCt2waSNJuhHH41f/xZwJ/TPJmunzeFxKPWVvXz4/NrLYWT7Mj6XXg\nJDNbXqN8V+ApS3hi03jsjoRrRecCJxJGGD5occ67NNT2RSHpLyaSJgG/raVbayjwsxS7C2vWI/Gb\nLONxp+eMRmsFvJriAIG/1Ciq7il5zsweTSNmFrxl0wCSjibc53In4cMDwtTdr0r6em4LpLGhtrFc\n2/skvEP4JndqTtfPZSnEyUrrmokGwnWb2GWROAvPdbkHuCde9D2LMK1Loskmg2tEPwAmSKq1Wyvp\nYDVuspwAPBPf/5hwz0+iyYbQqgHAzCqSHviTy8y+mdrBmxBv2TRAHGb6PTN7vUb5IcBtZnZEQnHy\n3bIZTuj6ORqo7vr5U766DdNW1+8szaGt+ZDBNaJ9gd2B/djSup8FzCZMeDov4XgT2HKT5VDCZJ8C\nLk3hJkskVQLVD4AT0J5wh3/io9Ek/aKO1WZmv04qVpY82TRAvu5HybnoK2AftlwATuWib07cvHf9\n5EOND5CtVgHtzCyV1k0+5PuLgqRHCINGptcoP4jQvfblhOPldmu1JMWbLPNN0o9qKe4IjAJ6mFmn\nPFcpFZ5sGkDS28BRcXhibnl34GUzOyChOI8RZtBdRC13uOfjzuOcrp9zzGxo2vFc4+Tri4Kk18zs\nsG2s+yQxJBgvbzdZZknSLoSBCKMID1O7LsnrwFnyZNMAki4ELiD0F1ff91JMeCjRn83stoTiXEr4\ntlpE+I93b82uO+e2Jc0vCpLmmNmAbayba2b7JhyvulX6yU2WpNStlYX4RfWHwNcJI+H+UPPLbHPn\nyaaBJJ0K/D+2Ho12rSX4wKicWH0JSWcE4Y/sXkLi+VfSsZyrD0n3ApPN7P9qlH+bMOLvnGxq1vxI\nupYwVP52wojW1Kb9yZInm2YmDmv9M/CZrO9ydjsvSb2AB4FNbD0arQ1hMtdEJ4ptCjdZpiUO7thI\nuME49wO5IFpt1TzZNEC+R4/Ecf5fJLRshgLPEVo2E5KM49yOknQCMDi+nWkpPcde0ji23GT5RcJj\nm1O5ydKlw5NNA+Rr9IikkwgXek8BXiWMMJoQ791wbqeRz5ssXTr8ps4GMLPrqpdzRo98k5AMrtvW\nfg0wmnBD4I8K7WKhczsobzdZunR4y6aBdobRI841Ffm8ydKlw1s2DVBj9MhBhTp6xLmmwgfDNH/e\nsmmAnWX0iHPOJcWTjXPOudS1yLoCzjnnCp8nG+ecc6nzZONcCiT9VNJMSW9JekNSIo+d2Eas5ySV\npHV855Lgo9GcS5ikI4FTgc+a2UZJPQnTuDi30/KWjXPJKwKWm9lGADNbbmYfSPqFpNckzZB0u+Kd\nibFlcr2kUklvSzpM0j8kzZH0m7hNP0nvSPpb3OZ+SR1qBpb0BUmvSJom6e+SOsXyqyXNii2t3+Xx\nd+Ec4MnGuTQ8BfSR9C9JN0v6XCy/ycwOM7PBhJsST83ZZ5OZlQC3Eh57fDFhzrFvSOoRt9kfuNnM\nDgTWAhflBo0tqJ8Bn49TuZQCP4z7nw4MMrPPAL9J4Zydq5MnG+cSFm/yLQYuBP4NjJP0DeAESVMl\nTSc82GxQzm4T48/phAktl8SW0btAn7huoZm9FJf/ChxTI/QQYCDwkqQ3gJFAX2ANsAG4Q9IZhDvv\nncsrv2bjXArMrJIwO/dzMbl8B/gMUGJmCyX9EmiXs8vG+LMqZ7n6ffXfac2b4mq+F/C0mZ1bsz6S\nDifMGH4m8H1CsnMub7xl41zCJO0vKfcplocAs+Py8ngd5cwGHHqvOPgA4GvAP2usnwIcLWnfWI+O\nkvaL8bqY2WPAZcDBDYjtXKN4y8a55HUCbpTUlTCl0VxCl9pqYAawFHitAcedDVws6c/ALOCW3JVm\n9u/YXXevpLax
+GfAR8CE+AAyESaQdS6vfLoa55oBSf2AR+LgAueaHe9Gc845lzpv2TjnnEudt2yc\nc86lzpONc8651Hmycc45lzpPNs4551LnycY551zqPNk455xL3f8HWAN68PHdQTsAAAAASUVORK5C\nYII=\n",
      "text/plain": [
       "<matplotlib.figure.Figure at 0x1ec484ef400>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "tag_fd.plot(cumulative=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 59,
   "metadata": {},
   "outputs": [],
   "source": [
    "nltk.app.concordance()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 71,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "brown_news_tagged = brown.tagged_words(categories='news', tagset='universal')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 76,
   "metadata": {},
   "outputs": [],
   "source": [
    "# nltk.bigrams() yields a one-shot generator; keep the pairs in a list so that\n",
    "# cells iterating over word_tag_pairs can be re-run without getting an empty result.\n",
    "word_tag_pairs = list(nltk.bigrams(brown_news_tagged))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 77,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Collect the tag of every token that is immediately followed by a NOUN-tagged token.\n",
    "noun_preceders = [\n",
    "    prev_tag\n",
    "    for ((_, prev_tag), (_, next_tag)) in word_tag_pairs\n",
    "    if next_tag == 'NOUN'\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 78,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "fdist = nltk.FreqDist(noun_preceders)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 79,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['NOUN',\n",
       " 'DET',\n",
       " 'ADJ',\n",
       " 'ADP',\n",
       " '.',\n",
       " 'VERB',\n",
       " 'CONJ',\n",
       " 'NUM',\n",
       " 'ADV',\n",
       " 'PRT',\n",
       " 'PRON',\n",
       " 'X']"
      ]
     },
     "execution_count": 79,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "[tag for (tag, _) in fdist.most_common()]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 80,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['is',\n",
       " 'said',\n",
       " 'was',\n",
       " 'are',\n",
       " 'be',\n",
       " 'has',\n",
       " 'have',\n",
       " 'will',\n",
       " 'says',\n",
       " 'would',\n",
       " 'were',\n",
       " 'had',\n",
       " 'been',\n",
       " 'could',\n",
       " \"'s\",\n",
       " 'can',\n",
       " 'do',\n",
       " 'say',\n",
       " 'make',\n",
       " 'may',\n",
       " 'did',\n",
       " 'rose',\n",
       " 'made',\n",
       " 'does',\n",
       " 'expected',\n",
       " 'buy',\n",
       " 'take',\n",
       " 'get',\n",
       " 'might',\n",
       " 'sell',\n",
       " 'added',\n",
       " 'sold',\n",
       " 'help',\n",
       " 'including',\n",
       " 'should',\n",
       " 'reported',\n",
       " 'according',\n",
       " 'pay',\n",
       " 'compared',\n",
       " 'being',\n",
       " 'fell',\n",
       " 'began',\n",
       " 'based',\n",
       " 'used',\n",
       " 'closed',\n",
       " \"'re\",\n",
       " 'want',\n",
       " 'see',\n",
       " 'took',\n",
       " 'yield',\n",
       " 'offered',\n",
       " 'set',\n",
       " 'priced',\n",
       " 'approved',\n",
       " 'come',\n",
       " 'noted',\n",
       " 'cut',\n",
       " 'ended',\n",
       " 'found',\n",
       " 'increased',\n",
       " 'become',\n",
       " 'think',\n",
       " 'named',\n",
       " 'go',\n",
       " 'trying',\n",
       " 'proposed',\n",
       " 'received',\n",
       " 'growing',\n",
       " 'declined',\n",
       " 'held',\n",
       " 'give',\n",
       " 'came',\n",
       " 'use',\n",
       " 'put',\n",
       " 'making',\n",
       " 'continue',\n",
       " 'raise',\n",
       " 'estimated',\n",
       " 'called',\n",
       " 'paid',\n",
       " 'designed',\n",
       " 'going',\n",
       " 'expects',\n",
       " 'seeking',\n",
       " 'must',\n",
       " 'plans',\n",
       " 'wo',\n",
       " 'increasing',\n",
       " 'saying',\n",
       " 'got',\n",
       " 'owns',\n",
       " 'trading',\n",
       " 'acquired',\n",
       " 'gained',\n",
       " 'fined',\n",
       " 'reached',\n",
       " 'holding',\n",
       " 'announced',\n",
       " 'filed',\n",
       " 'became',\n",
       " 'seek',\n",
       " 'included',\n",
       " 'using',\n",
       " 'led',\n",
       " 'decided',\n",
       " 'keep',\n",
       " 'disclosed',\n",
       " 'agreed',\n",
       " 'find',\n",
       " 'failed',\n",
       " 'run',\n",
       " 'taken',\n",
       " 'know',\n",
       " 'coming',\n",
       " \"'ve\",\n",
       " 'completed',\n",
       " 'built',\n",
       " 'raised',\n",
       " 'traded',\n",
       " 'lost',\n",
       " 'continued',\n",
       " 'paying',\n",
       " 'include',\n",
       " 'believe',\n",
       " 'receive',\n",
       " 'posted',\n",
       " 'wants',\n",
       " 'scheduled',\n",
       " 'went',\n",
       " 'indicated',\n",
       " 'provide',\n",
       " 'helped',\n",
       " 'needed',\n",
       " 'goes',\n",
       " 'told',\n",
       " 'result',\n",
       " 'need',\n",
       " 'caused',\n",
       " 'continues',\n",
       " 'dropped',\n",
       " 'showed',\n",
       " 'ordered',\n",
       " 'changed',\n",
       " 'face',\n",
       " 'continuing',\n",
       " 'launched',\n",
       " 'gives',\n",
       " 'reduce',\n",
       " \"'m\",\n",
       " 'lead',\n",
       " 'planned',\n",
       " 'wanted',\n",
       " 'following',\n",
       " 'remains',\n",
       " 'followed',\n",
       " 'remain',\n",
       " 'meet',\n",
       " 'believes',\n",
       " 'trade',\n",
       " 'includes',\n",
       " 'improve',\n",
       " 'buying',\n",
       " 'issued',\n",
       " 'rise',\n",
       " 'leading',\n",
       " 'ca',\n",
       " 'involved',\n",
       " 'known',\n",
       " 'like',\n",
       " 'makes',\n",
       " 'having',\n",
       " 'rejected',\n",
       " 'rising',\n",
       " 'increase',\n",
       " 'turned',\n",
       " 'operating',\n",
       " 'read',\n",
       " 'feel',\n",
       " 'win',\n",
       " 'given',\n",
       " 'prevent',\n",
       " 'offset',\n",
       " 'barred',\n",
       " 'earned',\n",
       " 'consented',\n",
       " 'support',\n",
       " 'gave',\n",
       " 'totaled',\n",
       " 'acquire',\n",
       " 'required',\n",
       " 'begin',\n",
       " 'require',\n",
       " 'offer',\n",
       " 'preferred',\n",
       " 'produced',\n",
       " 'bought',\n",
       " 'offering',\n",
       " 'asked',\n",
       " 'carry',\n",
       " 'build',\n",
       " 'takes',\n",
       " 'seem',\n",
       " 'introduced',\n",
       " 'taking',\n",
       " 'won',\n",
       " 'aimed',\n",
       " 'hurt',\n",
       " 'adds',\n",
       " 'cited',\n",
       " 'sought',\n",
       " 'bring',\n",
       " 'remaining',\n",
       " 'considered',\n",
       " 'suspended',\n",
       " 'prove',\n",
       " 'looking',\n",
       " 'doing',\n",
       " 'involving',\n",
       " 'opened',\n",
       " 'working',\n",
       " 'close',\n",
       " 'own',\n",
       " 'report',\n",
       " 'left',\n",
       " 'boosted',\n",
       " 'giving',\n",
       " 'fixed',\n",
       " 'listed',\n",
       " 'runs',\n",
       " 'purchasing',\n",
       " 'consider',\n",
       " 'prepared',\n",
       " 'hit',\n",
       " 'getting',\n",
       " 'alleged',\n",
       " 'look',\n",
       " 'allowed',\n",
       " 'approve',\n",
       " 'wrote',\n",
       " 'reduced',\n",
       " 'fall',\n",
       " 'advanced',\n",
       " 'appears',\n",
       " 'mixed',\n",
       " 'described',\n",
       " 'expect',\n",
       " 'manufacturing',\n",
       " 'spent',\n",
       " 'According',\n",
       " 'hopes',\n",
       " 'underlying',\n",
       " 'produce',\n",
       " 'work',\n",
       " 'placed',\n",
       " 'allow',\n",
       " 'sells',\n",
       " 'operate',\n",
       " 'extend',\n",
       " 'surged',\n",
       " 'jumped',\n",
       " 'boost',\n",
       " 'slowing',\n",
       " 'provided',\n",
       " 'seems',\n",
       " 'ending',\n",
       " 'selling',\n",
       " 'opposed',\n",
       " 'created',\n",
       " 'move',\n",
       " 'seen',\n",
       " 'comment',\n",
       " 'valued',\n",
       " 'losing',\n",
       " 'mature',\n",
       " 'provides',\n",
       " 'let',\n",
       " 'stopped',\n",
       " 'worked',\n",
       " 'thought',\n",
       " 'watch',\n",
       " 'introduce',\n",
       " 'related',\n",
       " 'improved',\n",
       " 'raising',\n",
       " 'seemed',\n",
       " 'force',\n",
       " 'beginning',\n",
       " 'leave',\n",
       " 'believed',\n",
       " 'stand',\n",
       " 'developed',\n",
       " 'decline',\n",
       " 'expire',\n",
       " 'managing',\n",
       " 'hold',\n",
       " 'invested',\n",
       " 'suggests',\n",
       " 'represent',\n",
       " 'settle',\n",
       " 'change',\n",
       " 'contributed',\n",
       " 'indicates',\n",
       " 'asking',\n",
       " 'elaborate',\n",
       " 'shows',\n",
       " 'refused',\n",
       " 'quoted',\n",
       " 'comes',\n",
       " 'ease',\n",
       " 'passed',\n",
       " 'Says',\n",
       " 'avoid',\n",
       " 'threatened',\n",
       " 'cause',\n",
       " 'end',\n",
       " 'violate',\n",
       " 'operates',\n",
       " 'kept',\n",
       " \"'ll\",\n",
       " 'soared',\n",
       " 'eliminated',\n",
       " 'becomes',\n",
       " 'create',\n",
       " 'print',\n",
       " 'shall',\n",
       " 'show',\n",
       " 'replaced',\n",
       " 'owned',\n",
       " 'argue',\n",
       " 'beat',\n",
       " 'elected',\n",
       " 'complete',\n",
       " 'issue',\n",
       " 'act',\n",
       " 'return',\n",
       " 'registered',\n",
       " 'suffer',\n",
       " 'worried',\n",
       " 'succeed',\n",
       " 'block',\n",
       " 'contain',\n",
       " 'occur',\n",
       " 'pursue',\n",
       " 'combined',\n",
       " 'requires',\n",
       " 'met',\n",
       " 'brought',\n",
       " 'started',\n",
       " 'covered',\n",
       " 'turn',\n",
       " 'running',\n",
       " 'eliminate',\n",
       " 'file',\n",
       " 'plunged',\n",
       " 'fallen',\n",
       " 'ran',\n",
       " 'fired',\n",
       " 'becoming',\n",
       " 'contained',\n",
       " 'managed',\n",
       " 'Take',\n",
       " 'suggested',\n",
       " 'accused',\n",
       " 'appeared',\n",
       " 'slow',\n",
       " 'helping',\n",
       " 'discovered',\n",
       " 'add',\n",
       " 'referred',\n",
       " 'oppose',\n",
       " 'stop',\n",
       " 'claim',\n",
       " 'sent',\n",
       " 'formed',\n",
       " 'resulting',\n",
       " 'turning',\n",
       " 'limited',\n",
       " 'shipped',\n",
       " 'forced',\n",
       " 'send',\n",
       " 'attract',\n",
       " 'admitting',\n",
       " 'denying',\n",
       " 'disgorge',\n",
       " 'attributed',\n",
       " 'causing',\n",
       " 'studied',\n",
       " 'resigned',\n",
       " 'cutting',\n",
       " 'voted',\n",
       " 'settled',\n",
       " 'expand',\n",
       " 'stood',\n",
       " 'retired',\n",
       " 'moved',\n",
       " 'pending',\n",
       " 'providing',\n",
       " 'anticipated',\n",
       " 'decide',\n",
       " 'creating',\n",
       " 'prompted',\n",
       " 'developing',\n",
       " 'start',\n",
       " 'maintained',\n",
       " 'expanding',\n",
       " 'follows',\n",
       " 'ranged',\n",
       " 'focused',\n",
       " 'climbed',\n",
       " 'reflect',\n",
       " 'insist',\n",
       " 'owed',\n",
       " 'happen',\n",
       " 'adjusted',\n",
       " 'awarded',\n",
       " 'reporting',\n",
       " 'talk',\n",
       " 'offers',\n",
       " 'written',\n",
       " 'urged',\n",
       " 'carried',\n",
       " 'identified',\n",
       " 'confirmed',\n",
       " 'playing',\n",
       " 'thinking',\n",
       " 'calls',\n",
       " 'means',\n",
       " 'tried',\n",
       " 'lying',\n",
       " 'asks',\n",
       " 'building',\n",
       " 'suggest',\n",
       " 'falling',\n",
       " 'discuss',\n",
       " 'matched',\n",
       " 'concluded',\n",
       " 'keeping',\n",
       " \"'d\",\n",
       " 'returned',\n",
       " 'withdrawn',\n",
       " 'bid',\n",
       " 'saw',\n",
       " 'signed',\n",
       " 'financing',\n",
       " 'assuming',\n",
       " 'adopted',\n",
       " 'attempting',\n",
       " 'accepted',\n",
       " 'cover',\n",
       " 'facing',\n",
       " 'risk',\n",
       " 'expanded',\n",
       " 'leaving',\n",
       " 'raises',\n",
       " 'declared',\n",
       " 'exercise',\n",
       " 'finished',\n",
       " 'regarding',\n",
       " 'finance',\n",
       " 'charge',\n",
       " 'starting',\n",
       " 'realize',\n",
       " 'felt',\n",
       " 'remained',\n",
       " 'expressed',\n",
       " 'done',\n",
       " 'replace',\n",
       " 'veto',\n",
       " 'stay',\n",
       " 'delivered',\n",
       " 'join',\n",
       " 'publishing',\n",
       " 'enters',\n",
       " 'appear',\n",
       " 'talking',\n",
       " 'heard',\n",
       " 'dumped',\n",
       " 'imported',\n",
       " 'assume',\n",
       " 'declining',\n",
       " 'capture',\n",
       " 'grew',\n",
       " 'holds',\n",
       " 'lift',\n",
       " 'treat',\n",
       " 'receiving',\n",
       " 'joined',\n",
       " 'reflecting',\n",
       " 'released',\n",
       " 'maintaining',\n",
       " 'cost',\n",
       " 'lowered',\n",
       " 'costs',\n",
       " 'exceed',\n",
       " 'gaining',\n",
       " 'considering',\n",
       " 'determined',\n",
       " 'ruled',\n",
       " 'hope',\n",
       " 'located',\n",
       " 'tied',\n",
       " 'heads',\n",
       " 'applied',\n",
       " 'failing',\n",
       " 'showing',\n",
       " 'apply',\n",
       " 'protecting',\n",
       " 'tells',\n",
       " 'complained',\n",
       " 'ask',\n",
       " 'triggered',\n",
       " 'entered',\n",
       " 'total',\n",
       " 'producing',\n",
       " 'denied',\n",
       " 'reducing',\n",
       " 'reflects',\n",
       " 'account',\n",
       " 'predicting',\n",
       " 'intended',\n",
       " 'purchased',\n",
       " 'blamed',\n",
       " 'worry',\n",
       " 'broken',\n",
       " 'carries',\n",
       " 'learned',\n",
       " 'renewed',\n",
       " 'walk',\n",
       " 'viewed',\n",
       " 'die',\n",
       " 'speculated',\n",
       " 'needs',\n",
       " 'gets',\n",
       " 'wait',\n",
       " 'caught',\n",
       " 'claims',\n",
       " 'choose',\n",
       " 'fail',\n",
       " 'insists',\n",
       " 'knows',\n",
       " 'pass',\n",
       " 'grown',\n",
       " 'gotten',\n",
       " 'grows',\n",
       " 'responded',\n",
       " 'play',\n",
       " 'try',\n",
       " 'mean',\n",
       " 'encourage',\n",
       " 'chosen',\n",
       " 'admits',\n",
       " 'Do',\n",
       " 'dismissed',\n",
       " 'realized',\n",
       " 'serve',\n",
       " 'associated',\n",
       " 'slipped',\n",
       " 'argued',\n",
       " 'citing',\n",
       " 'seeks',\n",
       " 'preventing',\n",
       " 'sparked',\n",
       " 'review',\n",
       " 'opening',\n",
       " 'fueled',\n",
       " 'negotiate',\n",
       " 'drop',\n",
       " 'pleased',\n",
       " 'spend',\n",
       " 'care',\n",
       " 'represents',\n",
       " 'spread',\n",
       " 'explains',\n",
       " 'push',\n",
       " 'divided',\n",
       " 'proposing',\n",
       " 'gain',\n",
       " 'representing',\n",
       " 'financed',\n",
       " 'execute',\n",
       " 'existing',\n",
       " 'discussed',\n",
       " 'uses',\n",
       " 'live',\n",
       " 'ring',\n",
       " 'signal',\n",
       " 'focus',\n",
       " 'hired',\n",
       " 'limit',\n",
       " 'begins',\n",
       " 'reflected',\n",
       " 'hear',\n",
       " 'determine',\n",
       " 'profit',\n",
       " 'marketed',\n",
       " 'warned',\n",
       " 'qualified',\n",
       " 'died',\n",
       " 'surviving',\n",
       " 'study',\n",
       " 'explained',\n",
       " 'imposed',\n",
       " 'recognize',\n",
       " 'eased',\n",
       " 'indicate',\n",
       " 'permit',\n",
       " 'retain',\n",
       " 'yielding',\n",
       " 'boosts',\n",
       " 'obtain',\n",
       " 'employs',\n",
       " 'banned',\n",
       " 'pointed',\n",
       " 'leaves',\n",
       " 'withdraw',\n",
       " 'refund',\n",
       " 'collected',\n",
       " 'upheld',\n",
       " 'benefited',\n",
       " 'doubled',\n",
       " 'attached',\n",
       " 'jump',\n",
       " 'compete',\n",
       " 'incurred',\n",
       " 'removed',\n",
       " 'honor',\n",
       " 'varying',\n",
       " 'marketing',\n",
       " 'protect',\n",
       " 'reach',\n",
       " 'share',\n",
       " 'requested',\n",
       " 'grant',\n",
       " 'stepping',\n",
       " 'direct',\n",
       " 'curb',\n",
       " 'controlling',\n",
       " 'snapped',\n",
       " 'tend',\n",
       " 'cast',\n",
       " 'clear',\n",
       " 'permitted',\n",
       " 'remove',\n",
       " 'revive',\n",
       " 'draw',\n",
       " 'predicted',\n",
       " 'suspect',\n",
       " 'coupled',\n",
       " 'belong',\n",
       " 'call',\n",
       " 'describes',\n",
       " 'played',\n",
       " 'committed',\n",
       " 'advertising',\n",
       " 'tested',\n",
       " 'revived',\n",
       " 'earns',\n",
       " 'feeling',\n",
       " 'turns',\n",
       " 'executed',\n",
       " 'killed',\n",
       " 'presented',\n",
       " 'deserve',\n",
       " 'mention',\n",
       " 'seeing',\n",
       " 'discussing',\n",
       " 'convicted',\n",
       " 'telling',\n",
       " 'agree',\n",
       " 'denies',\n",
       " 'pursued',\n",
       " 'spurred',\n",
       " 'accommodate',\n",
       " 'surrendered',\n",
       " 'gone',\n",
       " 'teach',\n",
       " 'booming',\n",
       " 'serving',\n",
       " 'restore',\n",
       " 'restructured',\n",
       " 'taught',\n",
       " 'feared',\n",
       " 'meant',\n",
       " 'adding',\n",
       " 'publishes',\n",
       " 'improving',\n",
       " 'ignoring',\n",
       " 'represented',\n",
       " 'funded',\n",
       " 'involve',\n",
       " 'charged',\n",
       " 'fared',\n",
       " 'eliminates',\n",
       " 'tumbled',\n",
       " 'redeemed',\n",
       " 'resolve',\n",
       " 'stem',\n",
       " 'hire',\n",
       " 'obtained',\n",
       " 'develop',\n",
       " 'employed',\n",
       " 'prohibits',\n",
       " 'promote',\n",
       " 'impose',\n",
       " 'consist',\n",
       " 'investigating',\n",
       " 'accepting',\n",
       " 'plan',\n",
       " 'insisted',\n",
       " 'contacted',\n",
       " 'note',\n",
       " 'driving',\n",
       " 'contends',\n",
       " 'cites',\n",
       " 'point',\n",
       " 'sign',\n",
       " 'printed',\n",
       " 'advertise',\n",
       " 'breaks',\n",
       " 'damaged',\n",
       " 'check',\n",
       " 'thinks',\n",
       " 'looming',\n",
       " 'expecting',\n",
       " 'exercised',\n",
       " 'auctioned',\n",
       " 'disappointed',\n",
       " 'subordinated',\n",
       " 'respond',\n",
       " 'secured',\n",
       " 'integrated',\n",
       " 'performed',\n",
       " 'targeting',\n",
       " 'stepped',\n",
       " 'moving',\n",
       " 'split',\n",
       " 'Buy',\n",
       " 'stemming',\n",
       " 'executing',\n",
       " 'shut',\n",
       " 'writing',\n",
       " 'regulated',\n",
       " 'stands',\n",
       " 'attend',\n",
       " 'reopen',\n",
       " 'drawn',\n",
       " 'Put',\n",
       " 'notes',\n",
       " 'weaken',\n",
       " 'trailed',\n",
       " 'deliver',\n",
       " 'occurred',\n",
       " 'changing',\n",
       " 'accept',\n",
       " 'expelled',\n",
       " 'amounted',\n",
       " 'scrutinizing',\n",
       " 'suspend',\n",
       " 'compares',\n",
       " 'backed',\n",
       " 'vote',\n",
       " 'covers',\n",
       " 'knew',\n",
       " 'joining',\n",
       " 'record',\n",
       " 'regarded',\n",
       " 'copy',\n",
       " 'conclude',\n",
       " 'ought',\n",
       " 'dominated',\n",
       " 'pushed',\n",
       " 'closing',\n",
       " 'rumored',\n",
       " 'respected',\n",
       " 'specified',\n",
       " 'understand',\n",
       " 'supported',\n",
       " 'perform',\n",
       " 'declaring',\n",
       " 'struggling',\n",
       " 'abandoned',\n",
       " 'considers',\n",
       " 'warning',\n",
       " 'offsetting',\n",
       " 'break',\n",
       " 'follow',\n",
       " 'figure',\n",
       " 'increases',\n",
       " 'proving',\n",
       " 'edged',\n",
       " 'Buying',\n",
       " 'forecast',\n",
       " 'specify',\n",
       " 'extended',\n",
       " 'tendered',\n",
       " 'unveiled',\n",
       " 'treating',\n",
       " 'exposed',\n",
       " 'industrialized',\n",
       " 'regulate',\n",
       " 'contracted',\n",
       " 'blip',\n",
       " 'vary',\n",
       " 'slid',\n",
       " 'succeeds',\n",
       " 'lifted',\n",
       " 'acts',\n",
       " 'welcomed',\n",
       " 'squeezed',\n",
       " 'fed',\n",
       " 'casting',\n",
       " 'prolonged',\n",
       " 'recorded',\n",
       " 'announce',\n",
       " 'reward',\n",
       " 'bowed',\n",
       " 'justify',\n",
       " 'asserted',\n",
       " 'appealing',\n",
       " 'faces',\n",
       " 'rule',\n",
       " 'inched',\n",
       " 'manufacture',\n",
       " 'fund',\n",
       " 'anticipates',\n",
       " 'link',\n",
       " 'describe',\n",
       " 'roll',\n",
       " 'calculate',\n",
       " 'transferring',\n",
       " 'favored',\n",
       " 'claiming',\n",
       " 'hurting',\n",
       " 'investing',\n",
       " 'trained',\n",
       " 'instituted',\n",
       " 'introducing',\n",
       " 'vowed',\n",
       " 'deemed',\n",
       " 'pose',\n",
       " 'concerned',\n",
       " 'accelerated',\n",
       " 'feels',\n",
       " 'solved',\n",
       " 'forgiven',\n",
       " 'stored',\n",
       " 'assembled',\n",
       " 'totaling',\n",
       " 'linked',\n",
       " 'forces',\n",
       " 'attempts',\n",
       " 'advertised',\n",
       " 'marks',\n",
       " 'sweeping',\n",
       " 'invest',\n",
       " 'kicked',\n",
       " 'brings',\n",
       " 'scrambled',\n",
       " 'diversify',\n",
       " 'swing',\n",
       " 'skyrocketed',\n",
       " 'targeted',\n",
       " 'repaid',\n",
       " 'open',\n",
       " 'crippled',\n",
       " 'lent',\n",
       " 'belongs',\n",
       " 'stressed',\n",
       " 'leveling',\n",
       " 'manufactured',\n",
       " 'pick',\n",
       " 'cite',\n",
       " 'provoke',\n",
       " 'last',\n",
       " 'climbing',\n",
       " 'Excluding',\n",
       " 'adjusting',\n",
       " 'counts',\n",
       " 'handle',\n",
       " 'polled',\n",
       " 'drink',\n",
       " 'sets',\n",
       " 'sidestep',\n",
       " 'fare',\n",
       " 'letting',\n",
       " 'entering',\n",
       " 'ban',\n",
       " 'visiting',\n",
       " 'endorsed',\n",
       " 'balked',\n",
       " 'compensate',\n",
       " 'terminated',\n",
       " 'modify',\n",
       " 'operated',\n",
       " 'entitles',\n",
       " 'romanticized',\n",
       " 'spends',\n",
       " 'condemned',\n",
       " 'competing',\n",
       " 'returning',\n",
       " 'murdered',\n",
       " 'load',\n",
       " 'lives',\n",
       " 'recommend',\n",
       " 'fighting',\n",
       " 'fills',\n",
       " 'charges',\n",
       " 'exist',\n",
       " 'Stung',\n",
       " 'banning',\n",
       " 'admitted',\n",
       " 'talks',\n",
       " 'launch',\n",
       " 'attracted',\n",
       " 'featured',\n",
       " 'devote',\n",
       " 'featuring',\n",
       " 'suing',\n",
       " 'shrinks',\n",
       " 'tripled',\n",
       " 'pumping',\n",
       " 'contributing',\n",
       " 'spur',\n",
       " 'concentrated',\n",
       " 'export',\n",
       " 'pull',\n",
       " 'approach',\n",
       " 'step',\n",
       " 'regard',\n",
       " 'breach',\n",
       " 'pleaded',\n",
       " 'inspired',\n",
       " 'defended',\n",
       " 'treated',\n",
       " 'casts',\n",
       " 'violated',\n",
       " 'enforce',\n",
       " 'surfaced',\n",
       " 'concentrate',\n",
       " 'stressing',\n",
       " 'suffered',\n",
       " 'loved',\n",
       " 'advised',\n",
       " 'studying',\n",
       " 'pushing',\n",
       " 'earn',\n",
       " 'save',\n",
       " 'interviewed',\n",
       " 'explain',\n",
       " 'gauge',\n",
       " 'measured',\n",
       " 'deny',\n",
       " 'hampered',\n",
       " 'fill',\n",
       " 'nominated',\n",
       " 'assured',\n",
       " 'finding',\n",
       " 'conducting',\n",
       " 'tracks',\n",
       " 'merge',\n",
       " 'merged',\n",
       " 'banking',\n",
       " 'achieve',\n",
       " 'acquiring',\n",
       " 'post',\n",
       " 'wish',\n",
       " 'retained',\n",
       " 'spark',\n",
       " 'chaired',\n",
       " 'deal',\n",
       " 'submit',\n",
       " 'sending',\n",
       " 'test',\n",
       " 'relegated',\n",
       " 'alleging',\n",
       " 'mounted',\n",
       " 'harass',\n",
       " 'crossing',\n",
       " 'involves',\n",
       " 'assist',\n",
       " 'killing',\n",
       " 'served',\n",
       " 'understood',\n",
       " 'touch',\n",
       " 'Asked',\n",
       " 'design',\n",
       " 'retaining',\n",
       " 'belonging',\n",
       " 'compiled',\n",
       " 'Guaranteed',\n",
       " 'positioned',\n",
       " 'plunging',\n",
       " 'locked',\n",
       " 'starts',\n",
       " 'waiting',\n",
       " 'rolled',\n",
       " 'lock',\n",
       " 'drifted',\n",
       " 'measures',\n",
       " 'Estimated',\n",
       " ...]"
      ]
     },
     "execution_count": 80,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "wsj = nltk.corpus.treebank.tagged_words(tagset='universal')\n",
    "word_tag_fd = nltk.FreqDist(wsj)\n",
    "[wt[0] for (wt, _) in word_tag_fd.most_common() if wt[1] == 'VERB']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 81,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "cfd1 = nltk.ConditionalFreqDist(wsj)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 82,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('VERB', 28), ('NOUN', 20)]"
      ]
     },
     "execution_count": 82,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "cfd1['yield'].most_common()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 84,
   "metadata": {},
   "outputs": [],
   "source": [
    "wsj = nltk.corpus.treebank.tagged_words()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 85,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "cfd2 = nltk.ConditionalFreqDist((tag, word) for (word, tag) in wsj)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 87,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "ConditionalFreqDist(nltk.probability.FreqDist,\n",
       "                    {'#': FreqDist({'#': 16}),\n",
       "                     '$': FreqDist({'$': 718, 'C$': 2, 'US$': 4}),\n",
       "                     \"''\": FreqDist({\"'\": 10, \"''\": 684}),\n",
       "                     ',': FreqDist({',': 4885, 'Wa': 1}),\n",
       "                     '-LRB-': FreqDist({'-LCB-': 14, '-LRB-': 106}),\n",
       "                     '-NONE-': FreqDist({'*': 965,\n",
       "                               '*-1': 1123,\n",
       "                               '*-10': 2,\n",
       "                               '*-100': 1,\n",
       "                               '*-101': 1,\n",
       "                               '*-102': 2,\n",
       "                               '*-103': 1,\n",
       "                               '*-104': 1,\n",
       "                               '*-105': 1,\n",
       "                               '*-106': 1,\n",
       "                               '*-107': 1,\n",
       "                               '*-108': 1,\n",
       "                               '*-109': 1,\n",
       "                               '*-11': 2,\n",
       "                               '*-110': 1,\n",
       "                               '*-111': 1,\n",
       "                               '*-112': 1,\n",
       "                               '*-113': 1,\n",
       "                               '*-114': 1,\n",
       "                               '*-115': 1,\n",
       "                               '*-116': 1,\n",
       "                               '*-117': 1,\n",
       "                               '*-118': 1,\n",
       "                               '*-119': 1,\n",
       "                               '*-12': 2,\n",
       "                               '*-120': 1,\n",
       "                               '*-121': 1,\n",
       "                               '*-122': 1,\n",
       "                               '*-123': 1,\n",
       "                               '*-124': 1,\n",
       "                               '*-125': 1,\n",
       "                               '*-126': 1,\n",
       "                               '*-127': 1,\n",
       "                               '*-128': 2,\n",
       "                               '*-129': 1,\n",
       "                               '*-13': 2,\n",
       "                               '*-130': 1,\n",
       "                               '*-131': 1,\n",
       "                               '*-132': 1,\n",
       "                               '*-133': 1,\n",
       "                               '*-134': 1,\n",
       "                               '*-135': 1,\n",
       "                               '*-136': 1,\n",
       "                               '*-137': 1,\n",
       "                               '*-138': 1,\n",
       "                               '*-139': 1,\n",
       "                               '*-14': 2,\n",
       "                               '*-140': 1,\n",
       "                               '*-141': 1,\n",
       "                               '*-142': 1,\n",
       "                               '*-144': 1,\n",
       "                               '*-145': 1,\n",
       "                               '*-146': 1,\n",
       "                               '*-147': 1,\n",
       "                               '*-149': 1,\n",
       "                               '*-15': 2,\n",
       "                               '*-150': 1,\n",
       "                               '*-151': 1,\n",
       "                               '*-152': 1,\n",
       "                               '*-153': 1,\n",
       "                               '*-154': 1,\n",
       "                               '*-155': 1,\n",
       "                               '*-156': 1,\n",
       "                               '*-157': 1,\n",
       "                               '*-158': 1,\n",
       "                               '*-159': 1,\n",
       "                               '*-16': 2,\n",
       "                               '*-160': 1,\n",
       "                               '*-161': 1,\n",
       "                               '*-162': 1,\n",
       "                               '*-163': 2,\n",
       "                               '*-164': 1,\n",
       "                               '*-165': 1,\n",
       "                               '*-166': 1,\n",
       "                               '*-17': 2,\n",
       "                               '*-18': 2,\n",
       "                               '*-19': 2,\n",
       "                               '*-2': 372,\n",
       "                               '*-20': 2,\n",
       "                               '*-21': 2,\n",
       "                               '*-22': 2,\n",
       "                               '*-23': 2,\n",
       "                               '*-24': 2,\n",
       "                               '*-25': 3,\n",
       "                               '*-26': 2,\n",
       "                               '*-27': 2,\n",
       "                               '*-28': 2,\n",
       "                               '*-29': 2,\n",
       "                               '*-3': 130,\n",
       "                               '*-30': 1,\n",
       "                               '*-31': 2,\n",
       "                               '*-32': 2,\n",
       "                               '*-33': 2,\n",
       "                               '*-34': 2,\n",
       "                               '*-35': 2,\n",
       "                               '*-36': 2,\n",
       "                               '*-37': 2,\n",
       "                               '*-38': 2,\n",
       "                               '*-39': 2,\n",
       "                               '*-4': 34,\n",
       "                               '*-40': 2,\n",
       "                               '*-41': 2,\n",
       "                               '*-42': 2,\n",
       "                               '*-43': 2,\n",
       "                               '*-44': 2,\n",
       "                               '*-45': 2,\n",
       "                               '*-46': 2,\n",
       "                               '*-47': 2,\n",
       "                               '*-48': 2,\n",
       "                               '*-49': 2,\n",
       "                               '*-5': 11,\n",
       "                               '*-50': 2,\n",
       "                               '*-51': 2,\n",
       "                               '*-52': 4,\n",
       "                               '*-53': 2,\n",
       "                               '*-54': 2,\n",
       "                               '*-55': 2,\n",
       "                               '*-56': 2,\n",
       "                               '*-57': 2,\n",
       "                               '*-58': 1,\n",
       "                               '*-59': 2,\n",
       "                               '*-6': 4,\n",
       "                               '*-60': 2,\n",
       "                               '*-61': 2,\n",
       "                               '*-62': 2,\n",
       "                               '*-63': 2,\n",
       "                               '*-64': 3,\n",
       "                               '*-66': 1,\n",
       "                               '*-67': 2,\n",
       "                               '*-68': 2,\n",
       "                               '*-69': 2,\n",
       "                               '*-7': 4,\n",
       "                               '*-70': 2,\n",
       "                               '*-71': 2,\n",
       "                               '*-72': 2,\n",
       "                               '*-73': 3,\n",
       "                               '*-74': 2,\n",
       "                               '*-75': 1,\n",
       "                               '*-76': 2,\n",
       "                               '*-77': 1,\n",
       "                               '*-78': 2,\n",
       "                               '*-79': 2,\n",
       "                               '*-8': 2,\n",
       "                               '*-80': 3,\n",
       "                               '*-81': 2,\n",
       "                               '*-82': 1,\n",
       "                               '*-83': 2,\n",
       "                               '*-84': 2,\n",
       "                               '*-85': 2,\n",
       "                               '*-86': 1,\n",
       "                               '*-87': 2,\n",
       "                               '*-88': 1,\n",
       "                               '*-89': 1,\n",
       "                               '*-9': 2,\n",
       "                               '*-90': 1,\n",
       "                               '*-91': 1,\n",
       "                               '*-92': 1,\n",
       "                               '*-93': 1,\n",
       "                               '*-94': 1,\n",
       "                               '*-95': 1,\n",
       "                               '*-96': 1,\n",
       "                               '*-97': 1,\n",
       "                               '*-98': 2,\n",
       "                               '*-99': 1,\n",
       "                               '*?*': 45,\n",
       "                               '*EXP*-1': 33,\n",
       "                               '*EXP*-2': 8,\n",
       "                               '*EXP*-3': 3,\n",
       "                               '*ICH*-1': 70,\n",
       "                               '*ICH*-2': 34,\n",
       "                               '*ICH*-3': 13,\n",
       "                               '*ICH*-4': 5,\n",
       "                               '*NOT*': 1,\n",
       "                               '*PPA*-1': 2,\n",
       "                               '*PPA*-2': 2,\n",
       "                               '*PPA*-3': 3,\n",
       "                               '*RNR*-1': 34,\n",
       "                               '*RNR*-2': 5,\n",
       "                               '*RNR*-4': 2,\n",
       "                               '*T*-1': 806,\n",
       "                               '*T*-10': 2,\n",
       "                               '*T*-100': 1,\n",
       "                               '*T*-101': 1,\n",
       "                               '*T*-102': 1,\n",
       "                               '*T*-103': 1,\n",
       "                               '*T*-104': 1,\n",
       "                               '*T*-105': 1,\n",
       "                               '*T*-106': 1,\n",
       "                               '*T*-107': 1,\n",
       "                               '*T*-108': 1,\n",
       "                               '*T*-109': 1,\n",
       "                               '*T*-11': 2,\n",
       "                               '*T*-110': 1,\n",
       "                               '*T*-111': 1,\n",
       "                               '*T*-112': 1,\n",
       "                               '*T*-113': 1,\n",
       "                               '*T*-114': 1,\n",
       "                               '*T*-115': 1,\n",
       "                               '*T*-116': 1,\n",
       "                               '*T*-117': 1,\n",
       "                               '*T*-118': 1,\n",
       "                               '*T*-119': 1,\n",
       "                               '*T*-12': 2,\n",
       "                               '*T*-120': 1,\n",
       "                               '*T*-121': 1,\n",
       "                               '*T*-122': 1,\n",
       "                               '*T*-123': 1,\n",
       "                               '*T*-124': 1,\n",
       "                               '*T*-125': 1,\n",
       "                               '*T*-126': 1,\n",
       "                               '*T*-127': 1,\n",
       "                               '*T*-128': 1,\n",
       "                               '*T*-129': 1,\n",
       "                               '*T*-13': 2,\n",
       "                               '*T*-130': 1,\n",
       "                               '*T*-131': 1,\n",
       "                               '*T*-132': 1,\n",
       "                               '*T*-133': 1,\n",
       "                               '*T*-134': 1,\n",
       "                               '*T*-135': 1,\n",
       "                               '*T*-136': 1,\n",
       "                               '*T*-137': 1,\n",
       "                               '*T*-138': 1,\n",
       "                               '*T*-139': 1,\n",
       "                               '*T*-14': 2,\n",
       "                               '*T*-140': 1,\n",
       "                               '*T*-141': 1,\n",
       "                               '*T*-142': 1,\n",
       "                               '*T*-143': 1,\n",
       "                               '*T*-144': 1,\n",
       "                               '*T*-145': 1,\n",
       "                               '*T*-146': 1,\n",
       "                               '*T*-147': 1,\n",
       "                               '*T*-148': 1,\n",
       "                               '*T*-149': 1,\n",
       "                               '*T*-15': 2,\n",
       "                               '*T*-150': 1,\n",
       "                               '*T*-151': 1,\n",
       "                               '*T*-152': 1,\n",
       "                               '*T*-153': 1,\n",
       "                               '*T*-154': 1,\n",
       "                               '*T*-155': 1,\n",
       "                               '*T*-156': 1,\n",
       "                               '*T*-157': 1,\n",
       "                               '*T*-158': 1,\n",
       "                               '*T*-159': 1,\n",
       "                               '*T*-16': 2,\n",
       "                               '*T*-160': 1,\n",
       "                               '*T*-161': 1,\n",
       "                               '*T*-162': 1,\n",
       "                               '*T*-163': 1,\n",
       "                               '*T*-164': 1,\n",
       "                               '*T*-165': 1,\n",
       "                               '*T*-166': 1,\n",
       "                               '*T*-167': 1,\n",
       "                               '*T*-168': 1,\n",
       "                               '*T*-169': 1,\n",
       "                               '*T*-17': 2,\n",
       "                               '*T*-170': 1,\n",
       "                               '*T*-171': 1,\n",
       "                               '*T*-172': 1,\n",
       "                               '*T*-173': 1,\n",
       "                               '*T*-174': 1,\n",
       "                               '*T*-175': 1,\n",
       "                               '*T*-176': 1,\n",
       "                               '*T*-177': 1,\n",
       "                               '*T*-178': 1,\n",
       "                               '*T*-179': 1,\n",
       "                               '*T*-18': 2,\n",
       "                               '*T*-180': 1,\n",
       "                               '*T*-181': 1,\n",
       "                               '*T*-182': 1,\n",
       "                               '*T*-183': 1,\n",
       "                               '*T*-184': 1,\n",
       "                               '*T*-185': 1,\n",
       "                               '*T*-186': 1,\n",
       "                               '*T*-187': 1,\n",
       "                               '*T*-188': 1,\n",
       "                               '*T*-189': 1,\n",
       "                               '*T*-19': 2,\n",
       "                               '*T*-190': 1,\n",
       "                               '*T*-191': 1,\n",
       "                               '*T*-192': 1,\n",
       "                               '*T*-193': 1,\n",
       "                               '*T*-194': 1,\n",
       "                               '*T*-195': 1,\n",
       "                               '*T*-196': 1,\n",
       "                               '*T*-197': 1,\n",
       "                               '*T*-198': 1,\n",
       "                               '*T*-199': 1,\n",
       "                               '*T*-2': 345,\n",
       "                               '*T*-20': 2,\n",
       "                               '*T*-200': 1,\n",
       "                               '*T*-201': 1,\n",
       "                               '*T*-202': 1,\n",
       "                               '*T*-203': 1,\n",
       "                               '*T*-204': 1,\n",
       "                               '*T*-205': 1,\n",
       "                               '*T*-206': 1,\n",
       "                               '*T*-207': 1,\n",
       "                               '*T*-208': 1,\n",
       "                               '*T*-21': 2,\n",
       "                               '*T*-210': 1,\n",
       "                               '*T*-211': 1,\n",
       "                               '*T*-212': 1,\n",
       "                               '*T*-213': 1,\n",
       "                               '*T*-214': 1,\n",
       "                               '*T*-215': 1,\n",
       "                               '*T*-216': 1,\n",
       "                               '*T*-217': 1,\n",
       "                               '*T*-218': 1,\n",
       "                               '*T*-219': 1,\n",
       "                               '*T*-22': 2,\n",
       "                               '*T*-220': 1,\n",
       "                               '*T*-221': 1,\n",
       "                               '*T*-222': 1,\n",
       "                               '*T*-223': 1,\n",
       "                               '*T*-224': 1,\n",
       "                               '*T*-225': 1,\n",
       "                               '*T*-226': 1,\n",
       "                               '*T*-227': 1,\n",
       "                               '*T*-228': 1,\n",
       "                               '*T*-229': 1,\n",
       "                               '*T*-23': 2,\n",
       "                               '*T*-230': 1,\n",
       "                               '*T*-231': 1,\n",
       "                               '*T*-232': 1,\n",
       "                               '*T*-233': 1,\n",
       "                               '*T*-234': 1,\n",
       "                               '*T*-235': 1,\n",
       "                               '*T*-236': 1,\n",
       "                               '*T*-237': 1,\n",
       "                               '*T*-238': 1,\n",
       "                               '*T*-239': 1,\n",
       "                               '*T*-24': 2,\n",
       "                               '*T*-240': 1,\n",
       "                               '*T*-241': 1,\n",
       "                               '*T*-242': 1,\n",
       "                               '*T*-243': 1,\n",
       "                               '*T*-244': 1,\n",
       "                               '*T*-245': 1,\n",
       "                               '*T*-246': 1,\n",
       "                               '*T*-247': 1,\n",
       "                               '*T*-248': 1,\n",
       "                               '*T*-249': 1,\n",
       "                               '*T*-25': 2,\n",
       "                               '*T*-250': 1,\n",
       "                               '*T*-251': 1,\n",
       "                               '*T*-252': 1,\n",
       "                               '*T*-253': 1,\n",
       "                               '*T*-254': 1,\n",
       "                               '*T*-255': 1,\n",
       "                               '*T*-256': 1,\n",
       "                               '*T*-257': 1,\n",
       "                               '*T*-258': 1,\n",
       "                               '*T*-259': 1,\n",
       "                               '*T*-26': 2,\n",
       "                               '*T*-260': 1,\n",
       "                               '*T*-27': 2,\n",
       "                               '*T*-28': 2,\n",
       "                               '*T*-29': 2,\n",
       "                               '*T*-3': 97,\n",
       "                               '*T*-30': 2,\n",
       "                               '*T*-31': 2,\n",
       "                               '*T*-32': 2,\n",
       "                               '*T*-33': 2,\n",
       "                               '*T*-34': 2,\n",
       "                               '*T*-35': 2,\n",
       "                               '*T*-36': 2,\n",
       "                               '*T*-37': 2,\n",
       "                               '*T*-38': 2,\n",
       "                               '*T*-39': 2,\n",
       "                               '*T*-4': 23,\n",
       "                               '*T*-40': 2,\n",
       "                               '*T*-41': 2,\n",
       "                               '*T*-42': 2,\n",
       "                               '*T*-43': 2,\n",
       "                               '*T*-44': 2,\n",
       "                               '*T*-45': 2,\n",
       "                               '*T*-46': 2,\n",
       "                               '*T*-47': 2,\n",
       "                               '*T*-48': 2,\n",
       "                               '*T*-49': 2,\n",
       "                               '*T*-5': 5,\n",
       "                               '*T*-50': 2,\n",
       "                               '*T*-51': 3,\n",
       "                               '*T*-52': 2,\n",
       "                               '*T*-53': 2,\n",
       "                               '*T*-54': 2,\n",
       "                               '*T*-55': 2,\n",
       "                               '*T*-56': 2,\n",
       "                               '*T*-57': 2,\n",
       "                               '*T*-58': 2,\n",
       "                               '*T*-59': 2,\n",
       "                               '*T*-6': 2,\n",
       "                               '*T*-60': 2,\n",
       "                               '*T*-61': 2,\n",
       "                               '*T*-62': 2,\n",
       "                               '*T*-63': 2,\n",
       "                               '*T*-64': 2,\n",
       "                               '*T*-65': 2,\n",
       "                               '*T*-66': 2,\n",
       "                               '*T*-67': 2,\n",
       "                               '*T*-68': 2,\n",
       "                               '*T*-69': 2,\n",
       "                               '*T*-7': 2,\n",
       "                               '*T*-70': 2,\n",
       "                               '*T*-71': 2,\n",
       "                               '*T*-72': 2,\n",
       "                               '*T*-73': 2,\n",
       "                               '*T*-74': 2,\n",
       "                               '*T*-75': 2,\n",
       "                               '*T*-76': 2,\n",
       "                               '*T*-77': 2,\n",
       "                               '*T*-78': 2,\n",
       "                               '*T*-79': 2,\n",
       "                               '*T*-8': 2,\n",
       "                               '*T*-80': 2,\n",
       "                               '*T*-81': 2,\n",
       "                               '*T*-82': 1,\n",
       "                               '*T*-83': 1,\n",
       "                               '*T*-84': 1,\n",
       "                               '*T*-85': 1,\n",
       "                               '*T*-86': 1,\n",
       "                               '*T*-87': 1,\n",
       "                               '*T*-88': 1,\n",
       "                               '*T*-89': 1,\n",
       "                               '*T*-9': 2,\n",
       "                               '*T*-90': 1,\n",
       "                               '*T*-91': 1,\n",
       "                               '*T*-92': 2,\n",
       "                               '*T*-93': 1,\n",
       "                               '*T*-94': 1,\n",
       "                               '*T*-95': 1,\n",
       "                               '*T*-96': 1,\n",
       "                               '*T*-97': 1,\n",
       "                               '*T*-98': 1,\n",
       "                               '*T*-99': 1,\n",
       "                               '*U*': 744,\n",
       "                               '0': 1099}),\n",
       "                     '-RRB-': FreqDist({'-RCB-': 14, '-RRB-': 112}),\n",
       "                     '.': FreqDist({'!': 6, '.': 3828, '?': 40}),\n",
       "                     ':': FreqDist({'-': 4,\n",
       "                               '--': 230,\n",
       "                               '...': 16,\n",
       "                               ':': 142,\n",
       "                               ';': 171}),\n",
       "                     'CC': FreqDist({'&': 85,\n",
       "                               'And': 44,\n",
       "                               'But': 157,\n",
       "                               'Either': 1,\n",
       "                               'Nor': 1,\n",
       "                               'Or': 3,\n",
       "                               'Yet': 4,\n",
       "                               'and': 1505,\n",
       "                               'but': 150,\n",
       "                               'either': 2,\n",
       "                               'minus': 1,\n",
       "                               'nor': 11,\n",
       "                               'or': 291,\n",
       "                               'plus': 3,\n",
       "                               'v.': 3,\n",
       "                               'versus': 1,\n",
       "                               'vs.': 1,\n",
       "                               'yet': 2}),\n",
       "                     'CD': FreqDist({\"'30s\": 1,\n",
       "                               \"'40s\": 1,\n",
       "                               \"'50s\": 1,\n",
       "                               \"'80s\": 1,\n",
       "                               \"'82\": 1,\n",
       "                               \"'86\": 1,\n",
       "                               '0.0085': 1,\n",
       "                               '0.05': 1,\n",
       "                               '0.1': 3,\n",
       "                               '0.16': 1,\n",
       "                               '0.2': 1,\n",
       "                               '0.25': 3,\n",
       "                               '0.28': 1,\n",
       "                               '0.3': 2,\n",
       "                               '0.4': 1,\n",
       "                               '0.5': 1,\n",
       "                               '0.50': 1,\n",
       "                               '0.54': 1,\n",
       "                               '0.56': 1,\n",
       "                               '0.60': 1,\n",
       "                               '0.7': 1,\n",
       "                               '0.82': 3,\n",
       "                               '0.84': 1,\n",
       "                               '0.9': 2,\n",
       "                               '0.95': 1,\n",
       "                               '0.99': 1,\n",
       "                               '1': 40,\n",
       "                               '1,000': 7,\n",
       "                               '1,050,000': 1,\n",
       "                               '1,100': 2,\n",
       "                               '1,200': 1,\n",
       "                               '1,298': 1,\n",
       "                               '1,400': 1,\n",
       "                               '1,460': 1,\n",
       "                               '1,500': 3,\n",
       "                               '1,570': 1,\n",
       "                               '1,620': 1,\n",
       "                               '1,880': 1,\n",
       "                               '1.01': 1,\n",
       "                               '1.1': 6,\n",
       "                               '1.125': 2,\n",
       "                               '1.14': 1,\n",
       "                               '1.1650': 1,\n",
       "                               '1.17': 1,\n",
       "                               '1.18': 1,\n",
       "                               '1.19': 1,\n",
       "                               '1.2': 3,\n",
       "                               '1.20': 1,\n",
       "                               '1.24': 1,\n",
       "                               '1.25': 3,\n",
       "                               '1.26': 2,\n",
       "                               '1.28': 1,\n",
       "                               '1.35': 1,\n",
       "                               '1.39': 1,\n",
       "                               '1.4': 1,\n",
       "                               '1.457': 1,\n",
       "                               '1.46': 1,\n",
       "                               '1.49': 1,\n",
       "                               '1.5': 7,\n",
       "                               '1.50': 1,\n",
       "                               '1.55': 2,\n",
       "                               '1.56': 1,\n",
       "                               '1.5755': 1,\n",
       "                               '1.5805': 1,\n",
       "                               '1.6': 3,\n",
       "                               '1.61': 1,\n",
       "                               '1.637': 1,\n",
       "                               '1.64': 2,\n",
       "                               '1.65': 3,\n",
       "                               '1.7': 2,\n",
       "                               '1.75': 1,\n",
       "                               '1.76': 2,\n",
       "                               '1.8': 2,\n",
       "                               '1.82': 1,\n",
       "                               '1.8415': 2,\n",
       "                               '1.85': 2,\n",
       "                               '1.8500': 3,\n",
       "                               '1.9': 1,\n",
       "                               '1.916': 1,\n",
       "                               '1.92': 1,\n",
       "                               '10': 51,\n",
       "                               '10,000': 18,\n",
       "                               '10-year': 1,\n",
       "                               '10.19': 1,\n",
       "                               '10.2': 3,\n",
       "                               '10.5': 1,\n",
       "                               '100': 40,\n",
       "                               '100,000': 6,\n",
       "                               '100,980': 1,\n",
       "                               '101': 2,\n",
       "                               '102': 2,\n",
       "                               '103': 1,\n",
       "                               '105': 1,\n",
       "                               '106': 1,\n",
       "                               '107': 2,\n",
       "                               '107.03': 1,\n",
       "                               '107.9': 1,\n",
       "                               '108': 1,\n",
       "                               '109.73': 1,\n",
       "                               '11': 17,\n",
       "                               '11,000': 2,\n",
       "                               '11,390,000': 1,\n",
       "                               '11,762': 1,\n",
       "                               '11.10': 1,\n",
       "                               '11.5': 1,\n",
       "                               '11.57': 1,\n",
       "                               '11.6': 1,\n",
       "                               '11.72': 1,\n",
       "                               '11.95': 1,\n",
       "                               '110': 1,\n",
       "                               '111': 2,\n",
       "                               '112.9': 1,\n",
       "                               '113.2': 1,\n",
       "                               '114': 1,\n",
       "                               '115': 2,\n",
       "                               '116.3': 1,\n",
       "                               '116.4': 1,\n",
       "                               '116.7': 1,\n",
       "                               '116.9': 1,\n",
       "                               '118': 2,\n",
       "                               '118.6': 1,\n",
       "                               '119': 1,\n",
       "                               '11\\\\/16': 1,\n",
       "                               '12': 23,\n",
       "                               '12,252': 1,\n",
       "                               '12.09': 1,\n",
       "                               '12.5': 6,\n",
       "                               '12.52': 1,\n",
       "                               '12.68': 1,\n",
       "                               '12.7': 1,\n",
       "                               '12.82': 1,\n",
       "                               '12.97': 1,\n",
       "                               '120': 6,\n",
       "                               '120,000': 1,\n",
       "                               '120.7': 1,\n",
       "                               '1206.26': 1,\n",
       "                               '121.6': 1,\n",
       "                               '125': 4,\n",
       "                               '126,000': 1,\n",
       "                               '126.1': 1,\n",
       "                               '126.15': 1,\n",
       "                               '127.03': 1,\n",
       "                               '128': 1,\n",
       "                               '129.91': 1,\n",
       "                               '12\\\\/32': 1,\n",
       "                               '13': 26,\n",
       "                               '13,056': 1,\n",
       "                               '13.1': 1,\n",
       "                               '13.15': 1,\n",
       "                               '13.5': 1,\n",
       "                               '13.50': 1,\n",
       "                               '13.625': 1,\n",
       "                               '13.65': 2,\n",
       "                               '13.73': 1,\n",
       "                               '13.8': 3,\n",
       "                               '13.90': 1,\n",
       "                               '130': 10,\n",
       "                               '130.6': 1,\n",
       "                               '130.7': 1,\n",
       "                               '131.01': 1,\n",
       "                               '132': 1,\n",
       "                               '132,000': 1,\n",
       "                               '132.9': 1,\n",
       "                               '133': 1,\n",
       "                               '133.7': 1,\n",
       "                               '133.8': 1,\n",
       "                               '135': 1,\n",
       "                               '138': 1,\n",
       "                               '139': 1,\n",
       "                               '13\\\\/16': 1,\n",
       "                               '14': 12,\n",
       "                               '14,821': 1,\n",
       "                               '14.': 1,\n",
       "                               '14.00': 1,\n",
       "                               '14.13': 1,\n",
       "                               '14.26': 1,\n",
       "                               '14.28': 1,\n",
       "                               '14.43': 1,\n",
       "                               '14.5': 1,\n",
       "                               '14.53': 1,\n",
       "                               '14.54': 1,\n",
       "                               '14.6': 1,\n",
       "                               '14.75': 1,\n",
       "                               '14.99': 1,\n",
       "                               '140': 3,\n",
       "                               '141.9': 1,\n",
       "                               '142.84': 1,\n",
       "                               '142.85': 2,\n",
       "                               '143.08': 1,\n",
       "                               '143.80': 3,\n",
       "                               '143.93': 1,\n",
       "                               '144': 1,\n",
       "                               '145': 2,\n",
       "                               '148': 1,\n",
       "                               '148.9': 1,\n",
       "                               '149': 1,\n",
       "                               '149.9': 1,\n",
       "                               '14\\\\/32': 1,\n",
       "                               '15': 42,\n",
       "                               '15,000': 21,\n",
       "                               '15.5': 1,\n",
       "                               '150': 6,\n",
       "                               '150,000': 1,\n",
       "                               '150.00': 1,\n",
       "                               '152,000': 1,\n",
       "                               '153.3': 1,\n",
       "                               '154,240,000': 2,\n",
       "                               '154.2': 1,\n",
       "                               '155': 2,\n",
       "                               '158,666': 1,\n",
       "                               '16': 12,\n",
       "                               '16,000': 2,\n",
       "                               '16,072': 1,\n",
       "                               '16.05': 1,\n",
       "                               '16.09': 1,\n",
       "                               '16.125': 1,\n",
       "                               '16.2': 1,\n",
       "                               '16.5': 1,\n",
       "                               '16.68': 1,\n",
       "                               '16.7': 3,\n",
       "                               '16.9': 1,\n",
       "                               '160': 1,\n",
       "                               '1614': 1,\n",
       "                               '1637': 1,\n",
       "                               '169.9': 1,\n",
       "                               '16\\\\/32': 1,\n",
       "                               '17': 15,\n",
       "                               '17.3': 3,\n",
       "                               '17.4': 1,\n",
       "                               '17.5': 1,\n",
       "                               '17.95': 2,\n",
       "                               '170': 1,\n",
       "                               '170,000': 1,\n",
       "                               '170,262': 1,\n",
       "                               '1738.1': 1,\n",
       "                               '175': 2,\n",
       "                               '176': 1,\n",
       "                               '176.1': 1,\n",
       "                               '177': 2,\n",
       "                               '1787': 1,\n",
       "                               '179': 2,\n",
       "                               '18': 18,\n",
       "                               '18,000': 2,\n",
       "                               '18,444': 1,\n",
       "                               '18.3': 1,\n",
       "                               '18.6': 1,\n",
       "                               '18.95': 1,\n",
       "                               '180': 5,\n",
       "                               '184': 1,\n",
       "                               '185.9': 1,\n",
       "                               '187': 1,\n",
       "                               '188': 2,\n",
       "                               '188.84': 1,\n",
       "                               '19': 8,\n",
       "                               '19.3': 1,\n",
       "                               '19.50': 1,\n",
       "                               '19.6': 2,\n",
       "                               '19.94': 1,\n",
       "                               '19.95': 1,\n",
       "                               '190': 2,\n",
       "                               '1901': 1,\n",
       "                               '1903': 1,\n",
       "                               '191.9': 1,\n",
       "                               '1917': 1,\n",
       "                               '1920s': 1,\n",
       "                               '1925': 1,\n",
       "                               '1928-33': 1,\n",
       "                               '1929': 3,\n",
       "                               '1933': 1,\n",
       "                               '1934': 1,\n",
       "                               '1937-40': 1,\n",
       "                               '1940s': 1,\n",
       "                               '1948': 2,\n",
       "                               '195': 3,\n",
       "                               '1950s': 2,\n",
       "                               '1953': 1,\n",
       "                               '1955': 1,\n",
       "                               '1956': 2,\n",
       "                               '1960s': 2,\n",
       "                               '1961': 1,\n",
       "                               '1965': 2,\n",
       "                               '1966': 1,\n",
       "                               '1967': 1,\n",
       "                               '1968': 1,\n",
       "                               '1969': 1,\n",
       "                               '1970': 4,\n",
       "                               '1970s': 2,\n",
       "                               '1971': 2,\n",
       "                               '1972': 4,\n",
       "                               '1973': 1,\n",
       "                               '1973-75': 1,\n",
       "                               '1975': 3,\n",
       "                               '1976': 5,\n",
       "                               '1977': 6,\n",
       "                               '1979': 6,\n",
       "                               '198': 1,\n",
       "                               '1980': 1,\n",
       "                               '1980s': 4,\n",
       "                               '1981': 4,\n",
       "                               '1982': 5,\n",
       "                               '1983': 5,\n",
       "                               '1983-85': 1,\n",
       "                               '1984': 8,\n",
       "                               '1985': 17,\n",
       "                               '1986': 10,\n",
       "                               '1986-87': 1,\n",
       "                               '1987': 32,\n",
       "                               '1987-88': 1,\n",
       "                               '1988': 45,\n",
       "                               '1988-89': 1,\n",
       "                               '1989': 40,\n",
       "                               '1989-90': 3,\n",
       "                               '1990': 43,\n",
       "                               '1990-91': 1,\n",
       "                               '1990s': 1,\n",
       "                               '1991': 18,\n",
       "                               '1991-1999': 1,\n",
       "                               '1991-2000': 1,\n",
       "                               '1992': 8,\n",
       "                               '1992-1999': 1,\n",
       "                               '1993': 5,\n",
       "                               '1994': 3,\n",
       "                               '1995': 1,\n",
       "                               '1996': 1,\n",
       "                               '1997': 1,\n",
       "                               '1998': 1,\n",
       "                               '1999': 5,\n",
       "                               '1:30': 1,\n",
       "                               '1\\\\/2': 27,\n",
       "                               '1\\\\/4': 12,\n",
       "                               '1\\\\/8': 11,\n",
       "                               '1st': 1,\n",
       "                               '2': 27,\n",
       "                               '2,000': 3,\n",
       "                               '2,099': 1,\n",
       "                               '2,303,328': 1,\n",
       "                               '2,410': 1,\n",
       "                               '2,500': 4,\n",
       "                               '2,700': 1,\n",
       "                               '2-3': 1,\n",
       "                               '2-8': 1,\n",
       "                               '2.07': 1,\n",
       "                               '2.1': 3,\n",
       "                               '2.15': 1,\n",
       "                               '2.19': 1,\n",
       "                               '2.2': 4,\n",
       "                               '2.25': 1,\n",
       "                               '2.29': 1,\n",
       "                               '2.3': 3,\n",
       "                               '2.30': 1,\n",
       "                               '2.35': 1,\n",
       "                               '2.375': 1,\n",
       "                               '2.4': 2,\n",
       "                               '2.42': 1,\n",
       "                               '2.44': 1,\n",
       "                               '2.46': 1,\n",
       "                               '2.47': 1,\n",
       "                               '2.5': 4,\n",
       "                               '2.50': 4,\n",
       "                               '2.6': 2,\n",
       "                               '2.62': 1,\n",
       "                               '2.65': 1,\n",
       "                               '2.7': 3,\n",
       "                               '2.75': 1,\n",
       "                               '2.8': 3,\n",
       "                               '2.80': 1,\n",
       "                               '2.87': 2,\n",
       "                               '2.875': 1,\n",
       "                               '2.9': 2,\n",
       "                               '2.95': 1,\n",
       "                               '20': 25,\n",
       "                               '20,000': 5,\n",
       "                               '20.07': 1,\n",
       "                               '20.5': 1,\n",
       "                               '200': 11,\n",
       "                               '200,000': 2,\n",
       "                               '2000': 2,\n",
       "                               '2003\\\\/2007': 1,\n",
       "                               '2005': 2,\n",
       "                               '2009': 9,\n",
       "                               '2017': 2,\n",
       "                               '2019': 6,\n",
       "                               '2029': 3,\n",
       "                               '203': 2,\n",
       "                               '20s': 1,\n",
       "                               '21': 12,\n",
       "                               '21,000': 1,\n",
       "                               '21.1': 1,\n",
       "                               '21.9': 1,\n",
       "                               '210': 1,\n",
       "                               '210,000': 1,\n",
       "                               '212': 1,\n",
       "                               '214': 1,\n",
       "                               '2141.7': 1,\n",
       "                               '2160.1': 1,\n",
       "                               '2163.2': 1,\n",
       "                               '22': 4,\n",
       "                               '22.75': 1,\n",
       "                               '220': 1,\n",
       "                               '220.45': 1,\n",
       "                               '221.4': 1,\n",
       "                               '225': 2,\n",
       "                               '225,000': 1,\n",
       "                               '225.6': 1,\n",
       "                               '226,570,380': 1,\n",
       "                               '227': 1,\n",
       "                               '228': 2,\n",
       "                               '22\\\\/32': 3,\n",
       "                               '23': 8,\n",
       "                               '23,000': 1,\n",
       "                               '23,403': 1,\n",
       "                               '23.25': 1,\n",
       "                               '23.4': 1,\n",
       "                               '23.5': 4,\n",
       "                               '23.72': 1,\n",
       "                               '230-215': 1,\n",
       "                               '234.4': 1,\n",
       "                               '235': 1,\n",
       "                               '236.74': 1,\n",
       "                               '236.79': 1,\n",
       "                               '24': 9,\n",
       "                               '24,000': 1,\n",
       "                               '24.95': 1,\n",
       "                               '240': 2,\n",
       "                               '240,000': 1,\n",
       "                               '241': 1,\n",
       "                               '244,000': 1,\n",
       "                               '245': 1,\n",
       "                               '25': 13,\n",
       "                               '25,000': 5,\n",
       "                               '25.50': 1,\n",
       "                               '25.6': 1,\n",
       "                               '250': 7,\n",
       "                               '250,000': 1,\n",
       "                               '251.2': 1,\n",
       "                               '257': 1,\n",
       "                               '26': 2,\n",
       "                               '26,000': 1,\n",
       "                               '26,956': 1,\n",
       "                               '26.2': 1,\n",
       "                               '26.5': 1,\n",
       "                               '26.8': 2,\n",
       "                               '260': 1,\n",
       "                               '263.07': 1,\n",
       "                               '2645.90': 3,\n",
       "                               '266': 1,\n",
       "                               '2691.19': 1,\n",
       "                               '27': 5,\n",
       "                               '27.1': 1,\n",
       "                               '27.4': 1,\n",
       "                               '270': 2,\n",
       "                               '271,124': 1,\n",
       "                               '271-147': 1,\n",
       "                               '273.5': 1,\n",
       "                               '274': 1,\n",
       "                               '275': 1,\n",
       "                               '278.7': 1,\n",
       "                               '28': 4,\n",
       "                               '28.25': 1,\n",
       "                               '28.36': 1,\n",
       "                               '28.4': 1,\n",
       "                               '28.5': 1,\n",
       "                               '28.53': 1,\n",
       "                               '28.6': 1,\n",
       "                               '280': 1,\n",
       "                               '282': 1,\n",
       "                               '286': 1,\n",
       "                               '29': 5,\n",
       "                               '29.3': 1,\n",
       "                               '29.4': 1,\n",
       "                               '29.9': 1,\n",
       "                               '292.32': 1,\n",
       "                               '295': 1,\n",
       "                               '2\\\\/32': 3,\n",
       "                               '3': 17,\n",
       "                               '3,040,000': 1,\n",
       "                               '3,250,000': 1,\n",
       "                               '3,288,453': 1,\n",
       "                               '3,500': 2,\n",
       "                               '3,600': 1,\n",
       "                               '3-4': 1,\n",
       "                               '3.01': 1,\n",
       "                               '3.04': 1,\n",
       "                               '3.1': 5,\n",
       "                               '3.16': 1,\n",
       "                               '3.18': 3,\n",
       "                               '3.19': 1,\n",
       "                               '3.2': 4,\n",
       "                               '3.20': 1,\n",
       "                               '3.23': 1,\n",
       "                               '3.253': 1,\n",
       "                               '3.28': 1,\n",
       "                               '3.3': 3,\n",
       "                               '3.35': 2,\n",
       "                               '3.375': 2,\n",
       "                               '3.4': 1,\n",
       "                               '3.42': 1,\n",
       "                               '3.43': 1,\n",
       "                               '3.5': 3,\n",
       "                               '3.55': 1,\n",
       "                               '3.6': 2,\n",
       "                               '3.61': 1,\n",
       "                               '3.625': 1,\n",
       "                               '3.7': 4,\n",
       "                               '3.75': 2,\n",
       "                               '3.8': 4,\n",
       "                               '3.80': 1,\n",
       "                               '3.9': 2,\n",
       "                               '30': 47,\n",
       "                               '30,000': 4,\n",
       "                               '30,537': 1,\n",
       "                               '30,841': 1,\n",
       "                               '30.6': 1,\n",
       "                               '30.9': 1,\n",
       "                               '300': 9,\n",
       "                               '300,000': 1,\n",
       "                               '300-113': 1,\n",
       "                               '301': 1,\n",
       "                               '3057': 1,\n",
       "                               '306': 1,\n",
       "                               '30s': 1,\n",
       "                               '31': 16,\n",
       "                               '310': 2,\n",
       "                               '313': 1,\n",
       "                               '319.75': 1,\n",
       "                               '32': 4,\n",
       "                               '32.8': 1,\n",
       "                               '320': 1,\n",
       "                               '321': 1,\n",
       "                               '321,000': 1,\n",
       "                               '325,000': 1,\n",
       "                               '326': 1,\n",
       "                               '33': 7,\n",
       "                               '331,000': 1,\n",
       "                               '334.5': 1,\n",
       "                               '339': 1,\n",
       "                               '34': 2,\n",
       "                               '34.625': 1,\n",
       "                               '340,000': 1,\n",
       "                               '341.20': 1,\n",
       "                               '343': 1,\n",
       "                               '3436.58': 1,\n",
       "                               '35': 7,\n",
       "                               '35.2': 1,\n",
       "                               '35.7': 2,\n",
       "                               '350': 1,\n",
       "                               '350,000': 2,\n",
       "                               '352.7': 1,\n",
       "                               '352.9': 1,\n",
       "                               '353': 1,\n",
       "                               '35500.64': 1,\n",
       "                               '35564.43': 1,\n",
       "                               '36': 1,\n",
       "                               '36.9': 1,\n",
       "                               '360': 1,\n",
       "                               '361,376': 1,\n",
       "                               '361.8': 1,\n",
       "                               '3648.82': 1,\n",
       "                               '37': 3,\n",
       "                               '37.3': 1,\n",
       "                               '37.5': 2,\n",
       "                               '370': 1,\n",
       "                               '372.14': 1,\n",
       "                               '372.9': 1,\n",
       "                               '374.19': 1,\n",
       "                               '374.20': 1,\n",
       "                               '377.60': 1,\n",
       "                               '38': 2,\n",
       "                               '38.3': 1,\n",
       "                               '38.375': 1,\n",
       "                               '38.5': 1,\n",
       "                               '38.875': 1,\n",
       "                               '380': 1,\n",
       "                               '382-37': 1,\n",
       "                               '386': 2,\n",
       "                               '387.8': 1,\n",
       "                               '388': 1,\n",
       "                               '39': 2,\n",
       "                               '396,000': 1,\n",
       "                               '397': 1,\n",
       "                               '3:15': 1,\n",
       "                               '3\\\\/4': 28,\n",
       "                               '3\\\\/8': 15,\n",
       "                               '4': 15,\n",
       "                               '4,000': 2,\n",
       "                               '4,393,237': 1,\n",
       "                               '4,645': 1,\n",
       "                               '4.1': 2,\n",
       "                               '4.10': 1,\n",
       "                               '4.2': 2,\n",
       "                               '4.25': 2,\n",
       "                               '4.3': 2,\n",
       "                               '4.4': 4,\n",
       "                               '4.5': 1,\n",
       "                               '4.55': 1,\n",
       "                               '4.6': 2,\n",
       "                               '4.7': 2,\n",
       "                               '4.75': 1,\n",
       "                               '4.8': 2,\n",
       "                               '4.875': 1,\n",
       "                               '4.898': 1,\n",
       "                               '4.9': 1,\n",
       "                               '40': 24,\n",
       "                               '40,000': 1,\n",
       "                               '40.21': 1,\n",
       "                               '400': 7,\n",
       "                               '400,000': 1,\n",
       "                               '405': 1,\n",
       "                               '41': 4,\n",
       "                               '41.60': 1,\n",
       "                               '415': 1,\n",
       "                               '415.6': 1,\n",
       "                               '415.8': 1,\n",
       "                               '42': 4,\n",
       "                               '42.1': 1,\n",
       "                               '42.5': 2,\n",
       "                               '420': 1,\n",
       "                               '422.5': 1,\n",
       "                               '43': 3,\n",
       "                               '43.875': 1,\n",
       "                               '430': 1,\n",
       "                               '434.4': 1,\n",
       "                               '436.01': 1,\n",
       "                               '44': 4,\n",
       "                               '445': 1,\n",
       "                               '446.62': 1,\n",
       "                               '449.04': 1,\n",
       "                               '45': 9,\n",
       "                               '45,000': 3,\n",
       "                               '45.2': 1,\n",
       "                               '45.3': 1,\n",
       "                               '45.75': 1,\n",
       "                               '450': 4,\n",
       "                               '451': 1,\n",
       "                               '454': 1,\n",
       "                               '456.64': 1,\n",
       "                               '458': 1,\n",
       "                               '46': 4,\n",
       "                               '46.1': 1,\n",
       "                               '467': 1,\n",
       "                               '47': 5,\n",
       "                               '47.1': 1,\n",
       "                               '47.125': 2,\n",
       "                               '47.5': 1,\n",
       "                               '47.6': 3,\n",
       "                               '472': 1,\n",
       "                               '48': 4,\n",
       "                               '49': 6,\n",
       "                               '49.9': 1,\n",
       "                               '490': 1,\n",
       "                               '492': 1,\n",
       "                               '494.50': 1,\n",
       "                               '497.34': 1,\n",
       "                               '5': 18,\n",
       "                               '5,000': 12,\n",
       "                               '5,699': 1,\n",
       "                               '5.1': 1,\n",
       "                               '5.2180': 1,\n",
       "                               '5.276': 1,\n",
       "                               '5.29': 1,\n",
       "                               '5.3': 1,\n",
       "                               '5.39': 1,\n",
       "                               '5.4': 2,\n",
       "                               '5.435': 1,\n",
       "                               '5.5': 3,\n",
       "                               '5.57': 1,\n",
       "                               '5.6': 1,\n",
       "                               '5.63': 1,\n",
       "                               '5.7': 1,\n",
       "                               '5.70': 1,\n",
       "                               '5.8': 1,\n",
       "                               '5.82': 1,\n",
       "                               '5.9': 1,\n",
       "                               '5.92': 1,\n",
       "                               '50': 46,\n",
       "                               '50,000': 4,\n",
       "                               '50-50': 1,\n",
       "                               '50.1': 1,\n",
       "                               '50.38': 1,\n",
       "                               '50.45': 1,\n",
       "                               '500': 38,\n",
       "                               '500,000': 3,\n",
       "                               '500,004': 1,\n",
       "                               '501': 1,\n",
       "                               '50\\\\/50': 1,\n",
       "                               '51': 7,\n",
       "                               '51.25': 1,\n",
       "                               '51.6': 1,\n",
       "                               '512': 1,\n",
       "                               '52': 3,\n",
       "                               '53': 4,\n",
       "                               '534': 1,\n",
       "                               '54': 1,\n",
       "                               '55': 10,\n",
       "                               '55.1': 1,\n",
       "                               '550,000': 1,\n",
       "                               '56': 1,\n",
       "                               '566.54': 1,\n",
       "                               '57': 2,\n",
       "                               '57.50': 2,\n",
       "                               '57.6': 1,\n",
       "                               '57.7': 1,\n",
       "                               '570': 1,\n",
       "                               '576': 1,\n",
       "                               '58': 4,\n",
       "                               '58.64': 1,\n",
       "                               '59': 6,\n",
       "                               '59.6': 1,\n",
       "                               '59.9': 2,\n",
       "                               '598': 1,\n",
       "                               '5\\\\/8': 13,\n",
       "                               '6': 17,\n",
       "                               '6,000': 2,\n",
       "                               '6,500': 1,\n",
       "                               '6,799': 1,\n",
       "                               '6.03': 1,\n",
       "                               '6.1': 2,\n",
       "                               '6.20': 3,\n",
       "                               '6.21': 1,\n",
       "                               '6.25': 2,\n",
       "                               '6.4': 1,\n",
       "                               '6.40': 3,\n",
       "                               '6.44': 1,\n",
       "                               '6.5': 2,\n",
       "                               '6.50': 1,\n",
       "                               '6.53': 1,\n",
       "                               '6.6': 2,\n",
       "                               '6.7': 1,\n",
       "                               '6.70': 1,\n",
       "                               '6.79': 2,\n",
       "                               '6.84': 1,\n",
       "                               '6.9': 2,\n",
       "                               '60': 13,\n",
       "                               '60,000': 2,\n",
       "                               '60.36': 1,\n",
       "                               '600': 3,\n",
       "                               '600,000': 2,\n",
       "                               '605': 2,\n",
       "                               '608,413': 1,\n",
       "                               '609': 1,\n",
       "                               '61': 5,\n",
       "                               '618.1': 1,\n",
       "                               '62': 7,\n",
       "                               '62.1': 1,\n",
       "                               '62.5': 2,\n",
       "                               '62.625': 1,\n",
       "                               '620': 1,\n",
       "                               '63': 5,\n",
       "                               '63.79': 1,\n",
       "                               '630.9': 1,\n",
       "                               '64': 3,\n",
       "                               '64.5': 1,\n",
       "                               '644': 2,\n",
       "                               '645,000': 2,\n",
       "                               '65': 7,\n",
       "                               '66.5': 1,\n",
       "                               '666': 1,\n",
       "                               '672': 1,\n",
       "                               '68': 2,\n",
       "                               '69': 2,\n",
       "                               '692': 1,\n",
       "                               '6\\\\/2': 1,\n",
       "                               '7': 20,\n",
       "                               '7,500': 2,\n",
       "                               '7.15': 1,\n",
       "                               '7.2': 2,\n",
       "                               '7.20': 1,\n",
       "                               '7.272': 3,\n",
       "                               '7.3': 4,\n",
       "                               '7.4': 1,\n",
       "                               '7.40': 2,\n",
       "                               '7.422': 1,\n",
       "                               '7.45': 1,\n",
       "                               '7.458': 3,\n",
       "                               '7.5': 3,\n",
       "                               '7.50': 1,\n",
       "                               '7.52': 1,\n",
       "                               '7.55': 1,\n",
       "                               '7.60': 1,\n",
       "                               '7.62': 1,\n",
       "                               '7.63': 1,\n",
       "                               '7.65': 1,\n",
       "                               '7.74': 2,\n",
       "                               '7.78': 1,\n",
       "                               '7.79': 1,\n",
       "                               '7.8': 1,\n",
       "                               '7.80': 1,\n",
       "                               '7.84': 1,\n",
       "                               '7.88': 4,\n",
       "                               '7.90': 4,\n",
       "                               '7.95': 2,\n",
       "                               '70': 13,\n",
       "                               '70.2': 1,\n",
       "                               '70.7': 2,\n",
       "                               '700': 1,\n",
       "                               '700,000': 1,\n",
       "                               '701': 1,\n",
       "                               '705.6': 1,\n",
       "                               '71': 3,\n",
       "                               '71,309': 1,\n",
       "                               '72': 2,\n",
       "                               '72.7': 1,\n",
       "                               '721': 1,\n",
       "                               '722': 1,\n",
       "                               '73': 2,\n",
       "                               '730': 1,\n",
       "                               '734.9': 1,\n",
       "                               '737.5': 1,\n",
       "                               '75': 8,\n",
       "                               '75-year-old': 1,\n",
       "                               '750': 3,\n",
       "                               '750,000': 2,\n",
       "                               '753': 1,\n",
       "                               '76': 1,\n",
       "                               '767': 3,\n",
       "                               '77': 2,\n",
       "                               '77,000': 1,\n",
       "                               '77.56': 1,\n",
       "                               '77.6': 1,\n",
       "                               '77.70': 1,\n",
       "                               '777': 1,\n",
       "                               '778': 1,\n",
       "                               '78': 1,\n",
       "                               '79': 1,\n",
       "                               '7\\\\/16': 2,\n",
       "                               '7\\\\/8': 13,\n",
       "                               '8': 36,\n",
       "                               '8.04': 2,\n",
       "                               '8.06': 1,\n",
       "                               '8.07': 2,\n",
       "                               '8.1': 2,\n",
       "                               '8.12': 1,\n",
       "                               '8.14': 1,\n",
       "                               '8.15': 1,\n",
       "                               '8.19': 1,\n",
       "                               '8.2': 1,\n",
       "                               '8.22': 1,\n",
       "                               '8.25': 2,\n",
       "                               '8.30': 1,\n",
       "                               '8.35': 1,\n",
       "                               '8.45': 2,\n",
       "                               '8.467': 1,\n",
       "                               '8.47': 2,\n",
       "                               '8.48': 1,\n",
       "                               '8.5': 3,\n",
       "                               '8.50': 3,\n",
       "                               '8.53': 1,\n",
       "                               '8.55': 2,\n",
       "                               '8.56': 1,\n",
       "                               '8.575': 1,\n",
       "                               '8.60': 1,\n",
       "                               '8.64': 1,\n",
       "                               '8.65': 1,\n",
       "                               '8.70': 1,\n",
       "                               '8.75': 1,\n",
       "                               '8.9': 2,\n",
       "                               '80': 7,\n",
       "                               '80.50': 1,\n",
       "                               '80.8': 1,\n",
       "                               '800': 3,\n",
       "                               '81.8': 1,\n",
       "                               '811.9': 1,\n",
       "                               '82,389': 1,\n",
       "                               '83': 1,\n",
       "                               '83,206': 1,\n",
       "                               '83.4': 1,\n",
       "                               '830,000': 1,\n",
       "                               '8300': 1,\n",
       "                               '84.29': 1,\n",
       "                               '84.9': 1,\n",
       "                               '847': 2,\n",
       "                               '85': 4,\n",
       "                               '85.1': 1,\n",
       "                               '85.7': 1,\n",
       "                               '850': 1,\n",
       "                               '858,000': 1,\n",
       "                               '86': 1,\n",
       "                               '86.12': 1,\n",
       "                               '87.5': 1,\n",
       "                               '877,663': 1,\n",
       "                               '879': 1,\n",
       "                               '88': 2,\n",
       "                               '88.32': 1,\n",
       "                               '89': 2,\n",
       "                               '89,500': 1,\n",
       "                               '89.7': 1,\n",
       "                               '89.9': 2,\n",
       "                               '890': 1,\n",
       "                               '9': 18,\n",
       "                               '9,118': 1,\n",
       "                               '9.3': 1,\n",
       "                               '9.32': 1,\n",
       "                               '9.37': 1,\n",
       "                               '9.45': 1,\n",
       "                               '9.5': 2,\n",
       "                               '9.625': 1,\n",
       "                               '9.75': 1,\n",
       "                               '9.8': 2,\n",
       "                               '9.82': 1,\n",
       "                               '9.9': 3,\n",
       "                               '90': 13,\n",
       "                               '900': 8,\n",
       "                               '909': 1,\n",
       "                               '913': 1,\n",
       "                               '917': 1,\n",
       "                               '92': 1,\n",
       "                               '92.9': 1,\n",
       "                               '93': 1,\n",
       "                               '93,000': 1,\n",
       "                               '93.3': 1,\n",
       "                               '93.9': 1,\n",
       "                               '94': 1,\n",
       "                               '94.2': 1,\n",
       "                               '94.8': 1,\n",
       "                               '95': 1,\n",
       "                               '95,142': 1,\n",
       "                               '95.09': 1,\n",
       "                               '96.4': 1,\n",
       "                               '960': 1,\n",
       "                               '963': 1,\n",
       "                               '967,809': 1,\n",
       "                               '98': 4,\n",
       "                               '98.3': 1,\n",
       "                               '99': 5,\n",
       "                               '99.1': 1,\n",
       "                               '99.3': 1,\n",
       "                               '992,000': 1,\n",
       "                               '9\\\\/32': 1,\n",
       "                               'Cray-3': 1,\n",
       "                               'FIRST': 1,\n",
       "                               'Fifteen': 1,\n",
       "                               'Five': 1,\n",
       "                               'Four': 1,\n",
       "                               'Fourteen': 1,\n",
       "                               'IX': 1,\n",
       "                               'Nine': 1,\n",
       "                               'One': 19,\n",
       "                               'Sept.30': 1,\n",
       "                               'THREE': 1,\n",
       "                               'TWO': 1,\n",
       "                               'Ten': 1,\n",
       "                               'Three': 2,\n",
       "                               'Two': 5,\n",
       "                               'billion': 159,\n",
       "                               'eight': 4,\n",
       "                               'five': 29,\n",
       "                               'four': 20,\n",
       "                               'hundred': 3,\n",
       "                               'mid-1970s': 1,\n",
       "                               'million': 383,\n",
       "                               'nine': 12,\n",
       "                               'one': 121,\n",
       "                               'seven': 9,\n",
       "                               'six': 31,\n",
       "                               'the': 1,\n",
       "                               'thousand': 1,\n",
       "                               'three': 48,\n",
       "                               'trillion': 5,\n",
       "                               'two': 103,\n",
       "                               'zero': 1}),\n",
       "                     'DT': FreqDist({'A': 105,\n",
       "                               'AN': 1,\n",
       "                               'All': 12,\n",
       "                               'An': 18,\n",
       "                               'Another': 6,\n",
       "                               'Any': 3,\n",
       "                               'Both': 9,\n",
       "                               'Each': 9,\n",
       "                               'Every': 2,\n",
       "                               'Neither': 5,\n",
       "                               'No': 10,\n",
       "                               'Some': 22,\n",
       "                               'THE': 2,\n",
       "                               'That': 37,\n",
       "                               'The': 713,\n",
       "                               'These': 22,\n",
       "                               'This': 40,\n",
       "                               'Those': 6,\n",
       "                               'a': 1874,\n",
       "                               'all': 86,\n",
       "                               'an': 316,\n",
       "                               'another': 42,\n",
       "                               'any': 103,\n",
       "                               'both': 34,\n",
       "                               'del': 1,\n",
       "                               'each': 37,\n",
       "                               'either': 5,\n",
       "                               'every': 19,\n",
       "                               'half': 10,\n",
       "                               'la': 1,\n",
       "                               'le': 1,\n",
       "                               'neither': 7,\n",
       "                               'no': 76,\n",
       "                               'some': 122,\n",
       "                               'that': 77,\n",
       "                               'the': 4038,\n",
       "                               'these': 55,\n",
       "                               'this': 184,\n",
       "                               'those': 55}),\n",
       "                     'EX': FreqDist({'There': 32, 'there': 56}),\n",
       "                     'FW': FreqDist({'Perestroika': 1,\n",
       "                               'besuboru': 1,\n",
       "                               'de': 1,\n",
       "                               'etc.': 1}),\n",
       "                     'IN': FreqDist({'@': 1,\n",
       "                               'About': 6,\n",
       "                               'Above': 1,\n",
       "                               'After': 10,\n",
       "                               'Against': 1,\n",
       "                               'Along': 2,\n",
       "                               'Although': 14,\n",
       "                               'Among': 13,\n",
       "                               'As': 29,\n",
       "                               'At': 28,\n",
       "                               'Because': 6,\n",
       "                               'Before': 2,\n",
       "                               'Behind': 1,\n",
       "                               'Besides': 4,\n",
       "                               'But': 1,\n",
       "                               'By': 11,\n",
       "                               'Despite': 11,\n",
       "                               'During': 5,\n",
       "                               'Except': 1,\n",
       "                               'For': 36,\n",
       "                               'From': 5,\n",
       "                               'If': 40,\n",
       "                               'In': 195,\n",
       "                               'Like': 5,\n",
       "                               'OF': 2,\n",
       "                               'OVER': 1,\n",
       "                               'Of': 4,\n",
       "                               'On': 17,\n",
       "                               'Once': 1,\n",
       "                               'Over': 2,\n",
       "                               'Since': 6,\n",
       "                               'So': 11,\n",
       "                               'Than': 1,\n",
       "                               'That': 1,\n",
       "                               'Though': 1,\n",
       "                               'Under': 14,\n",
       "                               'Unless': 1,\n",
       "                               'Unlike': 3,\n",
       "                               'Until': 5,\n",
       "                               'Whereas': 1,\n",
       "                               'Whether': 1,\n",
       "                               'While': 25,\n",
       "                               'With': 11,\n",
       "                               'Without': 6,\n",
       "                               'a': 1,\n",
       "                               'aboard': 1,\n",
       "                               'about': 176,\n",
       "                               'above': 15,\n",
       "                               'across': 14,\n",
       "                               'after': 77,\n",
       "                               'against': 34,\n",
       "                               'ago': 22,\n",
       "                               'along': 6,\n",
       "                               'although': 13,\n",
       "                               'amid': 4,\n",
       "                               'among': 31,\n",
       "                               'and': 1,\n",
       "                               'are': 1,\n",
       "                               'around': 24,\n",
       "                               'as': 333,\n",
       "                               'at': 402,\n",
       "                               'because': 116,\n",
       "                               'before': 42,\n",
       "                               'behind': 4,\n",
       "                               'below': 32,\n",
       "                               'between': 36,\n",
       "                               'beyond': 4,\n",
       "                               'by': 427,\n",
       "                               'complicated': 1,\n",
       "                               'de': 5,\n",
       "                               'despite': 14,\n",
       "                               'down': 19,\n",
       "                               'during': 38,\n",
       "                               'except': 7,\n",
       "                               'far': 1,\n",
       "                               'for': 815,\n",
       "                               'from': 386,\n",
       "                               'if': 80,\n",
       "                               'in': 1554,\n",
       "                               'including': 1,\n",
       "                               'into': 87,\n",
       "                               'like': 44,\n",
       "                               'near': 8,\n",
       "                               'next': 9,\n",
       "                               'notwithstanding': 1,\n",
       "                               'of': 2319,\n",
       "                               'off': 12,\n",
       "                               'on': 483,\n",
       "                               'once': 1,\n",
       "                               'onto': 2,\n",
       "                               'out': 28,\n",
       "                               'outside': 4,\n",
       "                               'over': 72,\n",
       "                               'per': 9,\n",
       "                               'since': 50,\n",
       "                               'so': 16,\n",
       "                               'than': 180,\n",
       "                               'that': 513,\n",
       "                               'though': 25,\n",
       "                               'through': 41,\n",
       "                               'throughout': 5,\n",
       "                               'till': 1,\n",
       "                               'to': 2,\n",
       "                               'toward': 5,\n",
       "                               'under': 60,\n",
       "                               'unless': 9,\n",
       "                               'unlike': 2,\n",
       "                               'until': 31,\n",
       "                               'up': 27,\n",
       "                               'upon': 8,\n",
       "                               'via': 15,\n",
       "                               'vs.': 1,\n",
       "                               'whether': 28,\n",
       "                               'which': 1,\n",
       "                               'while': 47,\n",
       "                               'with': 387,\n",
       "                               'within': 13,\n",
       "                               'without': 29,\n",
       "                               'worth': 3}),\n",
       "                     'JJ': FreqDist({'old': 24,\n",
       "                               'nonexecutive': 5,\n",
       "                               'former': 19,\n",
       "                               'British': 7,\n",
       "                               'industrial': 18,\n",
       "                               'high': 26,\n",
       "                               'resilient': 1,\n",
       "                               'brief': 4,\n",
       "                               'later': 11,\n",
       "                               'New': 6,\n",
       "                               'York-based': 4,\n",
       "                               'preliminary': 5,\n",
       "                               'likely': 20,\n",
       "                               'new': 162,\n",
       "                               'questionable': 3,\n",
       "                               'aware': 3,\n",
       "                               'useful': 2,\n",
       "                               'medical': 7,\n",
       "                               'modest': 3,\n",
       "                               'early': 29,\n",
       "                               'different': 21,\n",
       "                               'more': 1,\n",
       "                               'asbestos-related': 3,\n",
       "                               'malignant': 1,\n",
       "                               'striking': 2,\n",
       "                               'Western': 6,\n",
       "                               'common': 54,\n",
       "                               'other': 134,\n",
       "                               'few': 33,\n",
       "                               'smooth': 1,\n",
       "                               'needle-like': 1,\n",
       "                               'such': 82,\n",
       "                               'curly': 1,\n",
       "                               'gradual': 1,\n",
       "                               'cancer-causing': 1,\n",
       "                               'dusty': 1,\n",
       "                               'large': 29,\n",
       "                               'huge': 14,\n",
       "                               'dry': 4,\n",
       "                               'blue': 5,\n",
       "                               'human': 4,\n",
       "                               'money-market': 3,\n",
       "                               'mutual': 8,\n",
       "                               'further': 10,\n",
       "                               'average': 22,\n",
       "                               'seven-day': 3,\n",
       "                               'taxable': 2,\n",
       "                               'current': 30,\n",
       "                               'Average': 4,\n",
       "                               'open': 7,\n",
       "                               'recent': 72,\n",
       "                               'short-term': 14,\n",
       "                               'six-month': 6,\n",
       "                               'comparable': 3,\n",
       "                               'top': 10,\n",
       "                               'top-yielding': 1,\n",
       "                               'dollar-denominated': 3,\n",
       "                               'simple': 4,\n",
       "                               '30-day': 8,\n",
       "                               'energy-services': 1,\n",
       "                               'regulatory': 8,\n",
       "                               'Italian': 4,\n",
       "                               'state-owned': 2,\n",
       "                               'mechanical': 4,\n",
       "                               'computerized': 1,\n",
       "                               'annual': 17,\n",
       "                               'federal': 51,\n",
       "                               'capital-gains': 1,\n",
       "                               'next': 58,\n",
       "                               'senior': 18,\n",
       "                               'general': 19,\n",
       "                               'Japanese': 80,\n",
       "                               'biannual': 1,\n",
       "                               'sunny': 1,\n",
       "                               'corporate': 25,\n",
       "                               'rusty': 1,\n",
       "                               'good': 40,\n",
       "                               'unimpeded': 1,\n",
       "                               'red': 2,\n",
       "                               'special': 15,\n",
       "                               'everyday': 1,\n",
       "                               'official': 3,\n",
       "                               '10-lap': 1,\n",
       "                               'chocolate': 1,\n",
       "                               'tasty': 1,\n",
       "                               'free': 13,\n",
       "                               'standing': 1,\n",
       "                               'red-carpet': 1,\n",
       "                               'future': 18,\n",
       "                               'economic': 41,\n",
       "                               'Preliminary': 1,\n",
       "                               'fifth': 7,\n",
       "                               'monthly': 7,\n",
       "                               'export-oriented': 1,\n",
       "                               'mere': 2,\n",
       "                               'last': 86,\n",
       "                               'sluggish': 8,\n",
       "                               'gloomy': 1,\n",
       "                               'same': 37,\n",
       "                               'rival': 1,\n",
       "                               'second': 14,\n",
       "                               'permanent': 2,\n",
       "                               'fierce': 2,\n",
       "                               'full': 21,\n",
       "                               'four-color': 1,\n",
       "                               'first': 66,\n",
       "                               'heavy': 5,\n",
       "                               'electronic': 6,\n",
       "                               'big': 37,\n",
       "                               'flat': 8,\n",
       "                               'potential': 12,\n",
       "                               'outside': 5,\n",
       "                               'internal': 6,\n",
       "                               'independent': 6,\n",
       "                               'chief': 10,\n",
       "                               'executive': 28,\n",
       "                               'true': 7,\n",
       "                               'substantial': 6,\n",
       "                               'persistent': 4,\n",
       "                               'long': 15,\n",
       "                               'political': 19,\n",
       "                               'financial': 42,\n",
       "                               'troubled': 5,\n",
       "                               'possible': 24,\n",
       "                               'composite': 16,\n",
       "                               '12-member': 1,\n",
       "                               'illegal': 6,\n",
       "                               'nuclear': 5,\n",
       "                               'local': 23,\n",
       "                               'electric': 2,\n",
       "                               'exact': 6,\n",
       "                               'actual': 8,\n",
       "                               'past': 21,\n",
       "                               'administrative': 6,\n",
       "                               'unreasonable': 2,\n",
       "                               'subject': 8,\n",
       "                               'additional': 26,\n",
       "                               'Last': 14,\n",
       "                               'court-ordered': 1,\n",
       "                               'summer\\\\/winter': 1,\n",
       "                               'differential': 1,\n",
       "                               'poor': 5,\n",
       "                               'domestic': 13,\n",
       "                               'strong': 24,\n",
       "                               'year-to-year': 1,\n",
       "                               'previous': 19,\n",
       "                               'medium-sized': 3,\n",
       "                               'initial': 8,\n",
       "                               'product-design': 1,\n",
       "                               '64-year-old': 2,\n",
       "                               'operational': 1,\n",
       "                               'several': 32,\n",
       "                               'many': 83,\n",
       "                               'Minneapolis-based': 1,\n",
       "                               'public': 20,\n",
       "                               'worst-case': 1,\n",
       "                               'promissory': 1,\n",
       "                               'tricky': 1,\n",
       "                               'unproven': 1,\n",
       "                               'fragile': 2,\n",
       "                               'minute': 1,\n",
       "                               'robotic': 1,\n",
       "                               'intense': 5,\n",
       "                               'world-wide': 5,\n",
       "                               'direct': 7,\n",
       "                               'Big': 2,\n",
       "                               'Pro-forma': 1,\n",
       "                               'able': 16,\n",
       "                               'intellectual-property': 5,\n",
       "                               'so-called': 7,\n",
       "                               'interim': 4,\n",
       "                               'accelerated': 1,\n",
       "                               'unfair-trade': 1,\n",
       "                               'stiff': 2,\n",
       "                               'intellectual': 2,\n",
       "                               'genuine': 1,\n",
       "                               'touchy': 1,\n",
       "                               'own': 40,\n",
       "                               'inadequate': 2,\n",
       "                               'effective': 6,\n",
       "                               'search-and-seizure': 1,\n",
       "                               'bilateral': 4,\n",
       "                               'foreign': 23,\n",
       "                               'unauthorized': 1,\n",
       "                               'small': 44,\n",
       "                               'video-viewing': 1,\n",
       "                               'compatible': 1,\n",
       "                               'international': 18,\n",
       "                               'literary': 1,\n",
       "                               'lower-priority': 1,\n",
       "                               'less-serious': 1,\n",
       "                               'American': 28,\n",
       "                               'disturbing': 3,\n",
       "                               'slow': 6,\n",
       "                               'elaborate': 2,\n",
       "                               'pharmaceutical': 6,\n",
       "                               'bad': 14,\n",
       "                               'Argentine': 2,\n",
       "                               'external': 1,\n",
       "                               'significant': 14,\n",
       "                               'only': 10,\n",
       "                               'personal': 14,\n",
       "                               'crude': 4,\n",
       "                               'major': 44,\n",
       "                               'affordable': 1,\n",
       "                               'Crude': 2,\n",
       "                               'explosive': 1,\n",
       "                               'unlike': 1,\n",
       "                               'built-from-kit': 1,\n",
       "                               'Current': 2,\n",
       "                               'language-housekeeper': 1,\n",
       "                               'Australian': 2,\n",
       "                               'Jersey-based': 1,\n",
       "                               'convertible': 13,\n",
       "                               'joint': 9,\n",
       "                               'excise': 1,\n",
       "                               'buy-out': 1,\n",
       "                               'certain': 26,\n",
       "                               'non-encapsulating': 1,\n",
       "                               'duty-free': 5,\n",
       "                               'low-priced': 1,\n",
       "                               'battery-operated': 1,\n",
       "                               'main': 8,\n",
       "                               'eligible': 6,\n",
       "                               'resigned': 1,\n",
       "                               'automotive-parts': 1,\n",
       "                               'satisfactory': 2,\n",
       "                               'ambitious': 2,\n",
       "                               'excess': 3,\n",
       "                               'automotive': 5,\n",
       "                               'steady': 6,\n",
       "                               'quarterly': 5,\n",
       "                               '52-week': 1,\n",
       "                               'Canadian': 5,\n",
       "                               'influential': 2,\n",
       "                               '63-year-old': 1,\n",
       "                               'securities-based': 1,\n",
       "                               'mortgage-based': 1,\n",
       "                               'institutional': 10,\n",
       "                               'similar': 11,\n",
       "                               'mortgage-backed': 3,\n",
       "                               'seven-year': 1,\n",
       "                               'fixed-rate': 6,\n",
       "                               'floating-rate': 3,\n",
       "                               'key': 9,\n",
       "                               'First': 3,\n",
       "                               'Second': 2,\n",
       "                               'semiannual': 3,\n",
       "                               'attractive': 2,\n",
       "                               'Such': 9,\n",
       "                               'outstanding': 21,\n",
       "                               'rapid': 2,\n",
       "                               'total': 11,\n",
       "                               '54-year-old': 1,\n",
       "                               'exclusive': 4,\n",
       "                               'indirect': 1,\n",
       "                               '37-a-share': 1,\n",
       "                               'pursuant': 3,\n",
       "                               'hefty': 5,\n",
       "                               'sixth': 3,\n",
       "                               'consecutive': 5,\n",
       "                               'protracted': 2,\n",
       "                               'yen-support': 1,\n",
       "                               'closed-end': 3,\n",
       "                               'single': 10,\n",
       "                               'Washington-based': 1,\n",
       "                               'Next': 1,\n",
       "                               'Philippine': 1,\n",
       "                               'popular': 7,\n",
       "                               'traditional': 12,\n",
       "                               'open-end': 1,\n",
       "                               'one-country': 1,\n",
       "                               'available': 14,\n",
       "                               'heavy-duty': 1,\n",
       "                               'individual': 11,\n",
       "                               'easy': 10,\n",
       "                               'Financial': 2,\n",
       "                               'mature': 1,\n",
       "                               'hard': 7,\n",
       "                               'much': 30,\n",
       "                               'Political': 1,\n",
       "                               'wild': 2,\n",
       "                               'fat': 2,\n",
       "                               'underlying': 3,\n",
       "                               'late': 15,\n",
       "                               'European': 6,\n",
       "                               'startling': 2,\n",
       "                               'long-term': 14,\n",
       "                               'rich': 3,\n",
       "                               'global': 6,\n",
       "                               'foreign-stock': 1,\n",
       "                               'resistant': 1,\n",
       "                               'plenty': 1,\n",
       "                               'aghast': 1,\n",
       "                               'lofty': 1,\n",
       "                               'depositary': 1,\n",
       "                               'ready': 1,\n",
       "                               'technical': 5,\n",
       "                               'pre-Communist': 1,\n",
       "                               'Russian': 1,\n",
       "                               'Soviet': 10,\n",
       "                               'Coincident': 1,\n",
       "                               'short-lived': 1,\n",
       "                               'democratic': 3,\n",
       "                               'pre-1917': 1,\n",
       "                               'pre-1933': 1,\n",
       "                               'legal': 12,\n",
       "                               'lend-lease': 1,\n",
       "                               'separate': 9,\n",
       "                               'Private': 1,\n",
       "                               'usual': 3,\n",
       "                               'seasonal': 1,\n",
       "                               'residential': 4,\n",
       "                               'industrial-production': 1,\n",
       "                               'soft': 3,\n",
       "                               'excessive': 3,\n",
       "                               'nondurable': 1,\n",
       "                               'durable': 1,\n",
       "                               'level': 1,\n",
       "                               'unfilled': 1,\n",
       "                               'off': 2,\n",
       "                               'single-family': 1,\n",
       "                               'private': 20,\n",
       "                               'nonresidential': 1,\n",
       "                               'imminent': 5,\n",
       "                               'low': 23,\n",
       "                               'inflationary': 1,\n",
       "                               'particular': 7,\n",
       "                               'short': 11,\n",
       "                               'odd': 3,\n",
       "                               'nonfat': 1,\n",
       "                               'desultory': 1,\n",
       "                               'engaging': 1,\n",
       "                               'buttoned-down': 1,\n",
       "                               'contemporary': 4,\n",
       "                               'self-aggrandizing': 1,\n",
       "                               'we-Japanese': 1,\n",
       "                               'unique': 1,\n",
       "                               'unfathomable': 1,\n",
       "                               'implicit': 1,\n",
       "                               'nutty': 1,\n",
       "                               'imaginative': 1,\n",
       "                               'funny': 3,\n",
       "                               'disaffected': 1,\n",
       "                               'hard-drinking': 1,\n",
       "                               'nearly-30': 1,\n",
       "                               'elusive': 1,\n",
       "                               'sinister': 1,\n",
       "                               'erudite': 1,\n",
       "                               'prescient': 1,\n",
       "                               'sassy': 1,\n",
       "                               'docile': 1,\n",
       "                               'solicitous': 1,\n",
       "                               'Christian': 1,\n",
       "                               'sweet': 2,\n",
       "                               'roughhewn': 1,\n",
       "                               'a': 2,\n",
       "                               '40-year-old': 1,\n",
       "                               'fluent': 1,\n",
       "                               'youthful': 1,\n",
       "                               'idiomatic': 1,\n",
       "                               'Nipponese': 2,\n",
       "                               'fabled': 1,\n",
       "                               'important': 17,\n",
       "                               'humble': 1,\n",
       "                               'uncomplaining': 1,\n",
       "                               'obedient': 1,\n",
       "                               'male': 2,\n",
       "                               'unrecognizable': 2,\n",
       "                               'foul': 2,\n",
       "                               'even': 3,\n",
       "                               'strict': 3,\n",
       "                               'amusing': 2,\n",
       "                               'enormous': 2,\n",
       "                               'worth': 3,\n",
       "                               'petulant': 1,\n",
       "                               'impudent': 1,\n",
       "                               'supercilious': 1,\n",
       "                               'vicious': 1,\n",
       "                               'mundane': 1,\n",
       "                               'regimented': 1,\n",
       "                               'and': 3,\n",
       "                               'austere': 1,\n",
       "                               'prying': 1,\n",
       "                               'unproductive': 1,\n",
       "                               'hierarchical': 1,\n",
       "                               'assistant': 3,\n",
       "                               'chary': 1,\n",
       "                               'young': 12,\n",
       "                               'raring': 1,\n",
       "                               'social': 6,\n",
       "                               'venerable': 2,\n",
       "                               'exempt': 1,\n",
       "                               'prime': 3,\n",
       "                               'on-campus': 1,\n",
       "                               'materialistic': 2,\n",
       "                               'pressured': 3,\n",
       "                               'one-third': 1,\n",
       "                               'great': 12,\n",
       "                               'necessary': 10,\n",
       "                               'Palestinian': 1,\n",
       "                               'food-shop': 1,\n",
       "                               'chaotic': 1,\n",
       "                               'Polish': 2,\n",
       "                               'diplomatic': 1,\n",
       "                               'multibillion-dollar': 1,\n",
       "                               'Austrian': 1,\n",
       "                               'complete': 1,\n",
       "                               'environmental': 6,\n",
       "                               'Czech': 1,\n",
       "                               'Scandinavian': 1,\n",
       "                               'national': 10,\n",
       "                               'due': 38,\n",
       "                               'Toronto-based': 2,\n",
       "                               'real': 17,\n",
       "                               'Lead': 1,\n",
       "                               '36-minute': 1,\n",
       "                               'black-and-white': 1,\n",
       "                               'full-length': 1,\n",
       "                               'poignant': 1,\n",
       "                               'modern-day': 1,\n",
       "                               'homeless': 6,\n",
       "                               'silent': 2,\n",
       "                               'double': 1,\n",
       "                               'classical': 1,\n",
       "                               'exciting': 1,\n",
       "                               'eclectic': 1,\n",
       "                               'good-hearted': 1,\n",
       "                               'lovely': 1,\n",
       "                               'benign': 1,\n",
       "                               'good-natured': 1,\n",
       "                               'dead-eyed': 1,\n",
       "                               'four-year-old': 1,\n",
       "                               'carefree': 1,\n",
       "                               'blind': 2,\n",
       "                               'two-year-old': 1,\n",
       "                               'cute': 1,\n",
       "                               'serious': 12,\n",
       "                               'vagrant': 1,\n",
       "                               'far': 3,\n",
       "                               'little': 15,\n",
       "                               'improbable': 1,\n",
       "                               'expensive': 10,\n",
       "                               'high-rise': 1,\n",
       "                               'final': 8,\n",
       "                               'whimsical': 1,\n",
       "                               'enviable': 1,\n",
       "                               'rough': 2,\n",
       "                               'beaten': 1,\n",
       "                               'French': 4,\n",
       "                               'weird': 1,\n",
       "                               'harsh': 3,\n",
       "                               'brilliant': 2,\n",
       "                               'captivating': 1,\n",
       "                               'sympathetic': 2,\n",
       "                               'disagreeable': 1,\n",
       "                               'historical': 2,\n",
       "                               'diversionary': 1,\n",
       "                               'symbolic': 1,\n",
       "                               'small-time': 1,\n",
       "                               'war-rationed': 1,\n",
       "                               'untrained': 1,\n",
       "                               'botched': 1,\n",
       "                               'shallow': 1,\n",
       "                               'kind': 2,\n",
       "                               'playful': 1,\n",
       "                               'dreadful': 1,\n",
       "                               'war-damaged': 1,\n",
       "                               'thin-lipped': 1,\n",
       "                               'nice': 3,\n",
       "                               'confused': 1,\n",
       "                               'endless': 1,\n",
       "                               'bright': 2,\n",
       "                               'loose': 1,\n",
       "                               'energetic': 2,\n",
       "                               'regular': 3,\n",
       "                               'specific': 2,\n",
       "                               'combined': 1,\n",
       "                               'negative': 9,\n",
       "                               'secondary': 4,\n",
       "                               'presidential': 3,\n",
       "                               'off-off': 1,\n",
       "                               'empty': 1,\n",
       "                               'sometimes-tawdry': 1,\n",
       "                               'bold': 2,\n",
       "                               'entertaining': 1,\n",
       "                               'confrontational': 1,\n",
       "                               'truthful': 1,\n",
       "                               'principal': 5,\n",
       "                               'tight': 4,\n",
       "                               'facial': 1,\n",
       "                               'Democratic': 5,\n",
       "                               'straight': 3,\n",
       "                               'disembodied': 1,\n",
       "                               'phony': 1,\n",
       "                               'Nasty': 1,\n",
       "                               'distorted': 1,\n",
       "                               'cop-killer': 3,\n",
       "                               'pro-choice': 2,\n",
       "                               'Funny': 1,\n",
       "                               'classic': 3,\n",
       "                               'accurate': 2,\n",
       "                               'matching': 1,\n",
       "                               'incomplete': 4,\n",
       "                               'get-out-the-vote': 1,\n",
       "                               'deceptive': 1,\n",
       "                               'gubernatorial': 1,\n",
       "                               'Republican': 3,\n",
       "                               'commercial': 18,\n",
       "                               'very': 3,\n",
       "                               'unpleasant': 1,\n",
       "                               'legislative': 5,\n",
       "                               'unfounded': 1,\n",
       "                               'tired': 1,\n",
       "                               'positive': 6,\n",
       "                               'female': 4,\n",
       "                               'mean': 1,\n",
       "                               'dirty': 1,\n",
       "                               'hazardous': 2,\n",
       "                               'record': 2,\n",
       "                               'Southeast': 3,\n",
       "                               'Asian': 9,\n",
       "                               'fresh': 3,\n",
       "                               'steep': 2,\n",
       "                               'cash-rich': 1,\n",
       "                               'overseas': 7,\n",
       "                               'labor-intensive': 1,\n",
       "                               'subordinate': 1,\n",
       "                               'recipient': 2,\n",
       "                               'needed': 1,\n",
       "                               'military': 8,\n",
       "                               'fearful': 1,\n",
       "                               'U.S.-Japanese': 1,\n",
       "                               'cohesive': 1,\n",
       "                               'East': 3,\n",
       "                               'integrated': 1,\n",
       "                               'regional': 7,\n",
       "                               'crucial': 2,\n",
       "                               'difficult': 7,\n",
       "                               'enlarged': 1,\n",
       "                               'benevolent': 1,\n",
       "                               'altruistic': 1,\n",
       "                               'net': 38,\n",
       "                               'apprehensive': 1,\n",
       "                               'complicated': 4,\n",
       "                               'Many': 17,\n",
       "                               'desirable': 2,\n",
       "                               'Comprehensive': 1,\n",
       "                               'Basic': 3,\n",
       "                               'ninth': 1,\n",
       "                               'crib': 1,\n",
       "                               'uncanny': 1,\n",
       "                               'Senate-House': 1,\n",
       "                               'low-ability': 3,\n",
       "                               'overhead': 2,\n",
       "                               'unusual': 7,\n",
       "                               'guilty': 3,\n",
       "                               'unstinting': 1,\n",
       "                               'stunned': 1,\n",
       "                               'bald-faced': 1,\n",
       "                               'dark': 1,\n",
       "                               'high-stakes': 1,\n",
       "                               'school-improvement': 1,\n",
       "                               'student-test': 1,\n",
       "                               'incredible': 1,\n",
       "                               '50-state': 1,\n",
       "                               'school-research': 1,\n",
       "                               'outright': 2,\n",
       "                               'standardized': 7,\n",
       "                               'widespread': 5,\n",
       "                               'wrong': 6,\n",
       "                               'right': 5,\n",
       "                               'statewide': 2,\n",
       "                               'numerous': 6,\n",
       "                               'test-coaching': 2,\n",
       "                               'sophisticated': 5,\n",
       "                               'academic': 3,\n",
       "                               'precise': 1,\n",
       "                               'entire': 5,\n",
       "                               'wrenching': 1,\n",
       "                               'state-supervised': 1,\n",
       "                               'High': 1,\n",
       "                               'extra': 4,\n",
       "                               'primary': 4,\n",
       "                               'unfair': 10,\n",
       "                               'shaded': 1,\n",
       "                               'run-down': 2,\n",
       "                               'winning': 1,\n",
       "                               'yellow': 1,\n",
       "                               'broad': 4,\n",
       "                               'awful': 1,\n",
       "                               'seventh': 1,\n",
       "                               'immediate': 2,\n",
       "                               'nervous': 2,\n",
       "                               'disparate': 1,\n",
       "                               'split': 1,\n",
       "                               'privileged': 1,\n",
       "                               'white': 2,\n",
       "                               'monied': 1,\n",
       "                               'inner': 1,\n",
       "                               'overall': 7,\n",
       "                               'educational': 2,\n",
       "                               '37-year-old': 1,\n",
       "                               '14-hour': 1,\n",
       "                               'favorite': 2,\n",
       "                               'Encouraged': 1,\n",
       "                               'Cultural': 1,\n",
       "                               'inspirational': 1,\n",
       "                               'teacher-cadet': 1,\n",
       "                               '11th': 1,\n",
       "                               'forcing': 1,\n",
       "                               'fellow': 2,\n",
       "                               'cocky': 1,\n",
       "                               'yielding': 1,\n",
       "                               'Huge': 1,\n",
       "                               'meaningful': 2,\n",
       "                               'third': 15,\n",
       "                               'eager': 3,\n",
       "                               'if': 1,\n",
       "                               'interested': 6,\n",
       "                               'correct': 1,\n",
       "                               'whole': 2,\n",
       "                               'alive': 2,\n",
       "                               'drag-down': 1,\n",
       "                               'advanced': 2,\n",
       "                               'underprivileged': 1,\n",
       "                               'morale-damaging': 1,\n",
       "                               'quiet': 3,\n",
       "                               'dumbfounded': 1,\n",
       "                               'Supportive': 1,\n",
       "                               'first-time': 1,\n",
       "                               'worthy': 1,\n",
       "                               'crushed': 1,\n",
       "                               '17-year-old': 1,\n",
       "                               'familiar': 5,\n",
       "                               'red-and-white': 1,\n",
       "                               'angry': 2,\n",
       "                               'afraid': 3,\n",
       "                               'relieved': 1,\n",
       "                               'used': 2,\n",
       "                               'Roman': 1,\n",
       "                               'test-practice': 1,\n",
       "                               'Close': 1,\n",
       "                               'Test-preparation': 1,\n",
       "                               'school-sponsored': 1,\n",
       "                               'Standardized': 1,\n",
       "                               'eighth': 1,\n",
       "                               'test-prep': 1,\n",
       "                               'known': 1,\n",
       "                               'test-preparation': 1,\n",
       "                               'coincidental': 1,\n",
       "                               '69-point': 1,\n",
       "                               'the': 5,\n",
       "                               'geometrical': 1,\n",
       "                               'metric': 3,\n",
       "                               'two-letter': 1,\n",
       "                               'consonant': 1,\n",
       "                               'close': 7,\n",
       "                               'outraged': 1,\n",
       "                               'parallel': 1,\n",
       "                               'unaware': 1,\n",
       "                               'Sacramento-based': 1,\n",
       "                               'north': 1,\n",
       "                               'central': 6,\n",
       "                               'ancillary': 1,\n",
       "                               'fetal-tissue': 8,\n",
       "                               'Medical': 1,\n",
       "                               'fetal': 3,\n",
       "                               'juvenile': 1,\n",
       "                               'degenerative': 1,\n",
       "                               'tissue-transplant': 1,\n",
       "                               'acting': 1,\n",
       "                               'scientific': 4,\n",
       "                               'ethical': 3,\n",
       "                               'NIH-appointed': 1,\n",
       "                               'controlled': 1,\n",
       "                               'anti-abortion': 1,\n",
       "                               'prominent': 2,\n",
       "                               'prestigious': 4,\n",
       "                               'Several': 6,\n",
       "                               'ideological': 2,\n",
       "                               'uncharted': 2,\n",
       "                               'middle': 1,\n",
       "                               'funded': 1,\n",
       "                               'visible': 2,\n",
       "                               'damaged': 1,\n",
       "                               'mental': 7,\n",
       "                               'interstate': 6,\n",
       "                               'over-the-counter': 5,\n",
       "                               'lackluster': 1,\n",
       "                               'paltry': 2,\n",
       "                               'inauspicious': 1,\n",
       "                               'daily': 9,\n",
       "                               'nonfinancial': 1,\n",
       "                               'unattractive': 1,\n",
       "                               'head': 1,\n",
       "                               'green': 5,\n",
       "                               'London-based': 4,\n",
       "                               'third-quarter': 2,\n",
       "                               'pretax': 4,\n",
       "                               'related': 3,\n",
       "                               'mobile': 2,\n",
       "                               'one-time': 11,\n",
       "                               'dramatic': 3,\n",
       "                               'near-record': 1,\n",
       "                               'definitive': 1,\n",
       "                               'preferred': 3,\n",
       "                               'nine-member': 2,\n",
       "                               'fiscal': 41,\n",
       "                               'year-earlier': 10,\n",
       "                               'criminal': 7,\n",
       "                               'detailed': 2,\n",
       "                               'organized': 1,\n",
       "                               'attorney-client': 2,\n",
       "                               'punishable': 2,\n",
       "                               'computer-generated': 1,\n",
       "                               'certified': 1,\n",
       "                               'grand': 1,\n",
       "                               'moderate': 6,\n",
       "                               'Justice': 1,\n",
       "                               '8300': 1,\n",
       "                               'confidential': 3,\n",
       "                               'FEDERAL': 1,\n",
       "                               'JUDICIAL': 1,\n",
       "                               'lucrative': 3,\n",
       "                               'Federal': 1,\n",
       "                               'unjust': 2,\n",
       "                               'professional': 2,\n",
       "                               'sudden': 2,\n",
       "                               'high-priced': 3,\n",
       "                               'laughing': 1,\n",
       "                               'collective-bargaining': 1,\n",
       "                               'disciplinary': 4,\n",
       "                               'year-long': 1,\n",
       "                               'unjustified': 2,\n",
       "                               'family-planning': 2,\n",
       "                               'abortion-related': 1,\n",
       "                               'pregnant': 1,\n",
       "                               'homosexual': 2,\n",
       "                               'judicial': 3,\n",
       "                               '18-year-old': 1,\n",
       "                               'teenage': 1,\n",
       "                               'impartial': 1,\n",
       "                               'stock-manipulation': 1,\n",
       "                               'eight-count': 1,\n",
       "                               'planned': 1,\n",
       "                               'three-lawyer': 1,\n",
       "                               '520-lawyer': 1,\n",
       "                               'white-collar': 1,\n",
       "                               'square': 2,\n",
       "                               'cutthroat': 2,\n",
       "                               'municipal': 2,\n",
       "                               'tie-breaking': 1,\n",
       "                               'computer-system-design': 1,\n",
       "                               'sure': 5,\n",
       "                               'antitrust-law': 1,\n",
       "                               'packed': 1,\n",
       "                               'contrary': 1,\n",
       "                               'sorry': 1,\n",
       "                               'embarrassing': 1,\n",
       "                               'normal': 5,\n",
       "                               'extramarital': 1,\n",
       "                               'growing': 1,\n",
       "                               'low-ball': 1,\n",
       "                               'tense': 2,\n",
       "                               'limited': 2,\n",
       "                               'U.S.-Japan': 1,\n",
       "                               'one-yen': 1,\n",
       "                               'prefectural': 1,\n",
       "                               'Other': 6,\n",
       "                               'wheel-loader': 1,\n",
       "                               'German': 3,\n",
       "                               'computer-aided': 1,\n",
       "                               'metropolitan': 1,\n",
       "                               'industry-wide': 1,\n",
       "                               'custom-chip': 1,\n",
       "                               'extended': 1,\n",
       "                               'economical': 1,\n",
       "                               'appropriate': 1,\n",
       "                               'extraordinary': 5,\n",
       "                               'five-inch': 1,\n",
       "                               'more-efficient': 1,\n",
       "                               'six-inch': 2,\n",
       "                               'dead': 2,\n",
       "                               'slack': 1,\n",
       "                               'bearish': 1,\n",
       "                               'narrow': 1,\n",
       "                               'Dollar-yen': 1,\n",
       "                               'U.S.': 1,\n",
       "                               'solid': 4,\n",
       "                               'vitriolic': 1,\n",
       "                               'undisclosed': 1,\n",
       "                               'Great': 3,\n",
       "                               'forthcoming': 1,\n",
       "                               'yen-denominated': 1,\n",
       "                               'unclear': 1,\n",
       "                               'high-yield': 4,\n",
       "                               'unabated': 1,\n",
       "                               'minimal': 1,\n",
       "                               'willing': 8,\n",
       "                               'pre-emptive': 1,\n",
       "                               'NBC-owned': 1,\n",
       "                               'disappointed': 1,\n",
       "                               'uncomfortable': 1,\n",
       "                               'Atlanta-based': 1,\n",
       "                               'conventional': 5,\n",
       "                               'frantic': 1,\n",
       "                               'revenue-desperate': 1,\n",
       "                               'cozy': 1,\n",
       "                               'advertorial': 1,\n",
       "                               'how-to': 1,\n",
       "                               'explanatory': 1,\n",
       "                               'hard-hitting': 1,\n",
       "                               'alleged': 4,\n",
       "                               'considerable': 5,\n",
       "                               'whirling': 1,\n",
       "                               'would-be': 1,\n",
       "                               'furious': 1,\n",
       "                               'giant': 4,\n",
       "                               'non-biodegradable': 1,\n",
       "                               'journalistic': 1,\n",
       "                               'big-time': 1,\n",
       "                               'Individual': 1,\n",
       "                               'yearly': 1,\n",
       "                               'original': 4,\n",
       "                               'consumer-driven': 1,\n",
       "                               'pick-up': 1,\n",
       "                               'drop-off': 1,\n",
       "                               '70-a-share': 1,\n",
       "                               'buy-back': 1,\n",
       "                               'tender': 1,\n",
       "                               'Bermuda-based': 1,\n",
       "                               'hostile': 1,\n",
       "                               'asset-sale': 1,\n",
       "                               'conditional': 2,\n",
       "                               'superior': 2,\n",
       "                               'light': 12,\n",
       "                               'lap-shoulder': 1,\n",
       "                               'rear': 1,\n",
       "                               'front': 2,\n",
       "                               'ongoing': 3,\n",
       "                               'surprising': 5,\n",
       "                               'car-safety': 1,\n",
       "                               'systematic': 2,\n",
       "                               'light-truck': 2,\n",
       "                               'minimum': 11,\n",
       "                               'roof-crush': 4,\n",
       "                               'automatic': 3,\n",
       "                               'side-crash': 1,\n",
       "                               'unloaded': 1,\n",
       "                               'auto-safety': 1,\n",
       "                               'sport-utility': 1,\n",
       "                               'multilevel': 1,\n",
       "                               '58-year-old': 1,\n",
       "                               'formal': 2,\n",
       "                               'longstanding': 1,\n",
       "                               'Later': 1,\n",
       "                               'interesting': 6,\n",
       "                               'hot': 2,\n",
       "                               'merger-related': 1,\n",
       "                               'real-estate': 1,\n",
       "                               'payable': 1,\n",
       "                               'N.J.-based': 1,\n",
       "                               'year-ago': 2,\n",
       "                               'anti-takeover': 1,\n",
       "                               '51-year-old': 1,\n",
       "                               'exceptional': 1,\n",
       "                               'deluxe': 1,\n",
       "                               'flashy': 1,\n",
       "                               'precious': 3,\n",
       "                               'three-digit': 1,\n",
       "                               '10th': 1,\n",
       "                               'scarce': 1,\n",
       "                               'wholesale': 1,\n",
       "                               'retail': 6,\n",
       "                               're-thought': 1,\n",
       "                               'six-bottle': 1,\n",
       "                               'thin': 6,\n",
       "                               'suburban': 1,\n",
       "                               'astronomical': 1,\n",
       "                               'knowledgeable': 1,\n",
       "                               'beautiful': 4,\n",
       "                               'wine-buying': 1,\n",
       "                               'clear': 12,\n",
       "                               'free-lance': 1,\n",
       "                               'upward': 1,\n",
       "                               'fourth': 11,\n",
       "                               'downward': 1,\n",
       "                               'weak': 4,\n",
       "                               'Retail': 1,\n",
       "                               'discretionary': 2,\n",
       "                               'big-ticket': 1,\n",
       "                               'congressional': 10,\n",
       "                               'partisan': 1,\n",
       "                               'entangled': 1,\n",
       "                               'imperative': 1,\n",
       "                               'three-year': 2,\n",
       "                               '10-year': 4,\n",
       "                               '30-year': 11,\n",
       "                               '36-day': 1,\n",
       "                               'when-issued': 1,\n",
       "                               'two-year': 6,\n",
       "                               'five-year': 2,\n",
       "                               'pre-cooked': 1,\n",
       "                               'Long-term': 1,\n",
       "                               'Economic': 1,\n",
       "                               'Sept.': 1,\n",
       "                               'Net': 5,\n",
       "                               'various': 6,\n",
       "                               'proof': 1,\n",
       "                               'aggressive': 4,\n",
       "                               'unchanged': 11,\n",
       "                               'junk-bond': 1,\n",
       "                               'friendly': 4,\n",
       "                               'nominal': 1,\n",
       "                               'punitive': 1,\n",
       "                               'unfettered': 1,\n",
       "                               'heated': 1,\n",
       "                               'direct-investment': 1,\n",
       "                               'half-hour': 2,\n",
       "                               'automotive-lighting': 1,\n",
       "                               'disproportionate': 1,\n",
       "                               'anxious': 2,\n",
       "                               'successful': 5,\n",
       "                               'quick': 3,\n",
       "                               'basic': 3,\n",
       "                               'controversial': 4,\n",
       "                               'high-tech': 3,\n",
       "                               'myriad': 1,\n",
       "                               'tiny': 1,\n",
       "                               'joint-venture': 1,\n",
       "                               'bureaucratic': 1,\n",
       "                               'promising': 1,\n",
       "                               'Heightened': 1,\n",
       "                               'conspicuous': 2,\n",
       "                               'low-tech': 1,\n",
       "                               'strategic': 1,\n",
       "                               'architectural': 1,\n",
       "                               'feudal': 1,\n",
       "                               'Strategic': 1,\n",
       "                               'unsympathetic': 1,\n",
       "                               'content': 1,\n",
       "                               'convenient': 3,\n",
       "                               'high-balance': 1,\n",
       "                               'safe': 1,\n",
       "                               'competitive': 5,\n",
       "                               'pre-approved': 1,\n",
       "                               'cash-flow': 2,\n",
       "                               'elderly': 1,\n",
       "                               'demographic': 2,\n",
       "                               'Varying': 1,\n",
       "                               'athletic': 1,\n",
       "                               'to': 1,\n",
       "                               'active': 7,\n",
       "                               'safe-deposit': 1,\n",
       "                               'profitable': 7,\n",
       "                               'high-rate': 1,\n",
       "                               'standard': 5,\n",
       "                               'interest-bearing': 1,\n",
       "                               'staggering': 1,\n",
       "                               'market-share': 3,\n",
       "                               'money-center': 1,\n",
       "                               'rate-sensitive': 1,\n",
       "                               'costly': 3,\n",
       "                               'loyal': 1,\n",
       "                               'promotional': 1,\n",
       "                               'comprehensive': 1,\n",
       "                               'exercisable': 2,\n",
       "                               'low-cost': 1,\n",
       "                               'peripheral': 4,\n",
       "                               'Hawaiian': 1,\n",
       "                               'lasting': 1,\n",
       "                               'savings-and-loan': 2,\n",
       "                               'needy': 1,\n",
       "                               'solvent': 1,\n",
       "                               'healthy': 4,\n",
       "                               'critical': 1,\n",
       "                               'mid-size': 1,\n",
       "                               'bottom': 1,\n",
       "                               'one-hour': 3,\n",
       "                               '150-point': 1,\n",
       "                               '20-point': 1,\n",
       "                               'tumultuous': 1,\n",
       "                               'stock-index': 9,\n",
       "                               '30-minute': 1,\n",
       "                               '12-point': 3,\n",
       "                               'equal': 5,\n",
       "                               'subsequent': 1,\n",
       "                               '30-point': 2,\n",
       "                               'intermediate': 1,\n",
       "                               'one-day': 2,\n",
       "                               'five-point': 2,\n",
       "                               'post-hearing': 1,\n",
       "                               'program-trading': 9,\n",
       "                               'comfortable': 1,\n",
       "                               'volatile': 4,\n",
       "                               'preset': 2,\n",
       "                               'vague': 1,\n",
       "                               'mushy': 1,\n",
       "                               'sensitive': 1,\n",
       "                               ...}),\n",
       "                     'JJR': FreqDist({'Earlier': 3,\n",
       "                               'Fewer': 1,\n",
       "                               'Higher': 3,\n",
       "                               'Longer': 1,\n",
       "                               'More': 4,\n",
       "                               'Moreover': 1,\n",
       "                               'Shorter': 1,\n",
       "                               'better': 10,\n",
       "                               'bigger': 2,\n",
       "                               'broader': 6,\n",
       "                               'cheaper': 5,\n",
       "                               'cleaner': 2,\n",
       "                               'clearer': 1,\n",
       "                               'closer': 3,\n",
       "                               'colder': 1,\n",
       "                               'earlier': 34,\n",
       "                               'easier': 6,\n",
       "                               'faster': 4,\n",
       "                               'fewer': 6,\n",
       "                               'fuller': 1,\n",
       "                               'further': 1,\n",
       "                               'greater': 11,\n",
       "                               'happier': 1,\n",
       "                               'harder': 4,\n",
       "                               'higher': 47,\n",
       "                               'larger': 7,\n",
       "                               'less': 29,\n",
       "                               'lesser': 1,\n",
       "                               'lighter': 1,\n",
       "                               'longer': 4,\n",
       "                               'lower': 30,\n",
       "                               'more': 111,\n",
       "                               'newer': 1,\n",
       "                               'older': 5,\n",
       "                               'richer': 1,\n",
       "                               'riskier': 1,\n",
       "                               'savvier': 1,\n",
       "                               'sharper': 1,\n",
       "                               'slower': 4,\n",
       "                               'smaller': 8,\n",
       "                               'softer': 1,\n",
       "                               'steeper': 2,\n",
       "                               'stiffer': 1,\n",
       "                               'stronger': 5,\n",
       "                               'weaker': 3,\n",
       "                               'worse': 3,\n",
       "                               'younger': 2}),\n",
       "                     'JJS': FreqDist({'Most': 6,\n",
       "                               'best': 12,\n",
       "                               'best-selling': 1,\n",
       "                               'biggest': 7,\n",
       "                               'brightest': 1,\n",
       "                               'busiest': 1,\n",
       "                               'cheapest': 1,\n",
       "                               'dirtiest': 2,\n",
       "                               'earliest': 1,\n",
       "                               'fastest': 1,\n",
       "                               'finest': 1,\n",
       "                               'greatest': 2,\n",
       "                               'highest': 8,\n",
       "                               'hottest': 1,\n",
       "                               'largest': 28,\n",
       "                               'latest': 22,\n",
       "                               'least': 24,\n",
       "                               'longest': 1,\n",
       "                               'loudest': 1,\n",
       "                               'loveliest': 1,\n",
       "                               'lowest': 4,\n",
       "                               'most': 42,\n",
       "                               'newest': 1,\n",
       "                               'oldest': 2,\n",
       "                               'priciest': 1,\n",
       "                               'smallest': 1,\n",
       "                               'strongest': 4,\n",
       "                               'third-highest': 1,\n",
       "                               'worst': 4}),\n",
       "                     'LS': FreqDist({'1': 3,\n",
       "                               '2': 3,\n",
       "                               '3': 3,\n",
       "                               '4': 1,\n",
       "                               '5': 1,\n",
       "                               'a': 1,\n",
       "                               'b': 1}),\n",
       "                     'MD': FreqDist({\"'d\": 5,\n",
       "                               \"'ll\": 7,\n",
       "                               'Can': 1,\n",
       "                               'Could': 1,\n",
       "                               'ca': 12,\n",
       "                               'can': 93,\n",
       "                               'could': 120,\n",
       "                               'may': 70,\n",
       "                               'might': 43,\n",
       "                               'must': 19,\n",
       "                               'ought': 3,\n",
       "                               'shall': 7,\n",
       "                               'should': 38,\n",
       "                               'will': 280,\n",
       "                               'wo': 19,\n",
       "                               'would': 209}),\n",
       "                     'NN': FreqDist({'board': 30,\n",
       "                               'director': 32,\n",
       "                               'chairman': 45,\n",
       "                               'group': 43,\n",
       "                               'conglomerate': 3,\n",
       "                               'form': 16,\n",
       "                               'asbestos': 11,\n",
       "                               'cigarette': 4,\n",
       "                               'percentage': 11,\n",
       "                               'cancer': 7,\n",
       "                               'fiber': 1,\n",
       "                               'crocidolite': 5,\n",
       "                               'unit': 36,\n",
       "                               'Micronite': 1,\n",
       "                               'year': 212,\n",
       "                               'today': 22,\n",
       "                               'forum': 2,\n",
       "                               'attention': 8,\n",
       "                               'problem': 30,\n",
       "                               'spokewoman': 1,\n",
       "                               'story': 6,\n",
       "                               'anyone': 6,\n",
       "                               'research': 33,\n",
       "                               'information': 26,\n",
       "                               'risk': 7,\n",
       "                               'team': 17,\n",
       "                               'spokeswoman': 8,\n",
       "                               'paper': 28,\n",
       "                               'type': 11,\n",
       "                               'filter': 1,\n",
       "                               'company': 260,\n",
       "                               'substance': 5,\n",
       "                               'number': 45,\n",
       "                               'total': 9,\n",
       "                               'mesothelioma': 1,\n",
       "                               'lung': 2,\n",
       "                               'asbestosis': 1,\n",
       "                               'morbidity': 1,\n",
       "                               'rate': 41,\n",
       "                               'finding': 4,\n",
       "                               'factory': 12,\n",
       "                               'plant': 21,\n",
       "                               'contract': 36,\n",
       "                               'Lorillard': 1,\n",
       "                               'class': 8,\n",
       "                               'kind': 12,\n",
       "                               'chrysotile': 2,\n",
       "                               'standard': 2,\n",
       "                               'regulation': 3,\n",
       "                               'professor': 8,\n",
       "                               'pathlogy': 1,\n",
       "                               'body': 2,\n",
       "                               'ban': 10,\n",
       "                               'burlap': 1,\n",
       "                               'material': 10,\n",
       "                               'bin': 1,\n",
       "                               'cotton': 1,\n",
       "                               'acetate': 1,\n",
       "                               'process': 13,\n",
       "                               'dust': 1,\n",
       "                               'exhaust': 1,\n",
       "                               'area': 9,\n",
       "                               'question': 12,\n",
       "                               'vice': 43,\n",
       "                               'president': 133,\n",
       "                               'place': 17,\n",
       "                               'bearing': 1,\n",
       "                               'work': 19,\n",
       "                               'force': 16,\n",
       "                               'portfolio': 9,\n",
       "                               'interest': 53,\n",
       "                               'compound': 4,\n",
       "                               'yield': 20,\n",
       "                               'fraction': 1,\n",
       "                               'point': 26,\n",
       "                               '%': 445,\n",
       "                               'week': 55,\n",
       "                               'Compound': 1,\n",
       "                               'reinvestment': 1,\n",
       "                               'maturity': 3,\n",
       "                               'day': 23,\n",
       "                               'period': 25,\n",
       "                               'sign': 9,\n",
       "                               'indicator': 4,\n",
       "                               'market': 176,\n",
       "                               'editor': 11,\n",
       "                               'auction': 5,\n",
       "                               'example': 27,\n",
       "                               'cash': 43,\n",
       "                               'money': 53,\n",
       "                               'money-fund': 1,\n",
       "                               'fund': 11,\n",
       "                               'management': 22,\n",
       "                               'acquisition': 15,\n",
       "                               'share': 116,\n",
       "                               'thrift': 18,\n",
       "                               'approval': 10,\n",
       "                               'transaction': 20,\n",
       "                               'year-end': 2,\n",
       "                               'sale': 27,\n",
       "                               'engineering': 8,\n",
       "                               'industry': 41,\n",
       "                               'revenue': 11,\n",
       "                               'government': 83,\n",
       "                               'ceiling': 10,\n",
       "                               'debt': 46,\n",
       "                               'authority': 12,\n",
       "                               'borrowing': 3,\n",
       "                               'midnight': 2,\n",
       "                               'Legislation': 1,\n",
       "                               'fight': 3,\n",
       "                               'manager': 27,\n",
       "                               'marketing': 14,\n",
       "                               'arm': 3,\n",
       "                               'auto': 13,\n",
       "                               'maker': 28,\n",
       "                               'position': 12,\n",
       "                               'service': 24,\n",
       "                               'division': 24,\n",
       "                               'executive': 40,\n",
       "                               'time': 62,\n",
       "                               'powwow': 1,\n",
       "                               'nation': 25,\n",
       "                               'resort': 2,\n",
       "                               'capital': 32,\n",
       "                               'fall': 15,\n",
       "                               'meeting': 16,\n",
       "                               'city': 17,\n",
       "                               'royalty': 1,\n",
       "                               'rock': 1,\n",
       "                               'idea': 11,\n",
       "                               'course': 11,\n",
       "                               'decision': 19,\n",
       "                               'buckle': 1,\n",
       "                               'end': 23,\n",
       "                               'message': 4,\n",
       "                               'evening': 4,\n",
       "                               'guest': 1,\n",
       "                               'pianist-comedian': 1,\n",
       "                               'Champagne': 1,\n",
       "                               'dessert': 1,\n",
       "                               'morning': 4,\n",
       "                               'police': 2,\n",
       "                               'escort': 1,\n",
       "                               'traffic': 1,\n",
       "                               'governor': 3,\n",
       "                               'lieutenant': 1,\n",
       "                               'buffet': 1,\n",
       "                               'breakfast': 1,\n",
       "                               'museum': 2,\n",
       "                               'food': 16,\n",
       "                               'honor': 2,\n",
       "                               'speedway': 1,\n",
       "                               'announcer': 5,\n",
       "                               'exhibition': 2,\n",
       "                               'race': 3,\n",
       "                               'space': 9,\n",
       "                               'sponsor': 2,\n",
       "                               'name': 7,\n",
       "                               'downtown': 2,\n",
       "                               'hotel': 3,\n",
       "                               'dinner': 2,\n",
       "                               'dancing': 1,\n",
       "                               'block': 3,\n",
       "                               'ballroom': 1,\n",
       "                               'town': 3,\n",
       "                               'duckling': 1,\n",
       "                               'mousseline': 1,\n",
       "                               'lobster': 1,\n",
       "                               'consomme': 1,\n",
       "                               'veal': 1,\n",
       "                               'mignon': 1,\n",
       "                               'terrine': 1,\n",
       "                               'raspberry': 1,\n",
       "                               'sauce': 1,\n",
       "                               'meal': 2,\n",
       "                               'ovation': 1,\n",
       "                               'treatment': 9,\n",
       "                               'heartland': 1,\n",
       "                               'winter': 1,\n",
       "                               'trade': 38,\n",
       "                               'deficit': 6,\n",
       "                               'country': 46,\n",
       "                               'sluggishness': 1,\n",
       "                               'setback': 2,\n",
       "                               'cloud': 1,\n",
       "                               'economy': 26,\n",
       "                               'increase': 20,\n",
       "                               'boom': 2,\n",
       "                               'labor': 5,\n",
       "                               'Government': 2,\n",
       "                               'target': 8,\n",
       "                               'forecast': 4,\n",
       "                               'surplus': 2,\n",
       "                               'pace': 6,\n",
       "                               'magazine': 23,\n",
       "                               'advertising': 10,\n",
       "                               'incentive': 4,\n",
       "                               'plan': 45,\n",
       "                               'ad': 28,\n",
       "                               'spending': 24,\n",
       "                               'news': 24,\n",
       "                               'competition': 10,\n",
       "                               'page': 5,\n",
       "                               'circulation': 10,\n",
       "                               'base': 9,\n",
       "                               'subscriber': 1,\n",
       "                               'renewal': 1,\n",
       "                               'attempt': 8,\n",
       "                               'decline': 14,\n",
       "                               'drop': 15,\n",
       "                               'department': 27,\n",
       "                               'use': 17,\n",
       "                               'none': 4,\n",
       "                               'decrease': 2,\n",
       "                               'bidding': 6,\n",
       "                               'payoff': 1,\n",
       "                               'future': 8,\n",
       "                               'offer': 37,\n",
       "                               'move': 18,\n",
       "                               'reorganization': 9,\n",
       "                               'Chapter': 4,\n",
       "                               'bankruptcy': 9,\n",
       "                               'value': 24,\n",
       "                               'bid': 31,\n",
       "                               'officer': 32,\n",
       "                               'return': 22,\n",
       "                               'equity': 17,\n",
       "                               'growth': 39,\n",
       "                               'electricity': 4,\n",
       "                               'demand': 28,\n",
       "                               'operating': 15,\n",
       "                               'way': 30,\n",
       "                               'matter': 13,\n",
       "                               'adviser': 5,\n",
       "                               'withdrawal': 3,\n",
       "                               'fact': 15,\n",
       "                               'state': 31,\n",
       "                               'field': 10,\n",
       "                               'request': 8,\n",
       "                               'purchase': 23,\n",
       "                               'review': 10,\n",
       "                               'summer': 8,\n",
       "                               'one': 9,\n",
       "                               'court': 35,\n",
       "                               'yesterday': 61,\n",
       "                               'trading': 144,\n",
       "                               'chief': 41,\n",
       "                               'consumer': 13,\n",
       "                               'retailing': 3,\n",
       "                               'chain': 8,\n",
       "                               'undersecretary': 2,\n",
       "                               'cost': 12,\n",
       "                               'power': 25,\n",
       "                               'refund': 6,\n",
       "                               'utility': 5,\n",
       "                               'State': 1,\n",
       "                               'order': 18,\n",
       "                               'pool': 1,\n",
       "                               'hostage': 1,\n",
       "                               'round': 5,\n",
       "                               'commission': 8,\n",
       "                               'amount': 19,\n",
       "                               'ruling': 12,\n",
       "                               'spokesman': 39,\n",
       "                               'nightmare': 1,\n",
       "                               'challenge': 3,\n",
       "                               'construction': 31,\n",
       "                               'month': 44,\n",
       "                               'precedent': 4,\n",
       "                               'case': 29,\n",
       "                               'performance': 18,\n",
       "                               'record': 25,\n",
       "                               'passenger': 3,\n",
       "                               'price': 66,\n",
       "                               'introduction': 8,\n",
       "                               'consumption': 1,\n",
       "                               'tax': 17,\n",
       "                               'control': 16,\n",
       "                               'motor': 2,\n",
       "                               'household': 3,\n",
       "                               'survival': 4,\n",
       "                               'spinoff': 8,\n",
       "                               'fledgling': 1,\n",
       "                               'supercomputer': 5,\n",
       "                               'business': 76,\n",
       "                               'creativity': 2,\n",
       "                               'longevity': 1,\n",
       "                               'designer': 4,\n",
       "                               'development': 18,\n",
       "                               'machine': 7,\n",
       "                               'balance': 5,\n",
       "                               'sheet': 3,\n",
       "                               'financing': 8,\n",
       "                               'firm': 38,\n",
       "                               'project': 5,\n",
       "                               'prototype': 1,\n",
       "                               'choice': 2,\n",
       "                               'interview': 10,\n",
       "                               'theory': 3,\n",
       "                               'scenario': 2,\n",
       "                               'filing': 9,\n",
       "                               'stock': 136,\n",
       "                               'note': 7,\n",
       "                               'presence': 6,\n",
       "                               'valuation': 2,\n",
       "                               'investor': 39,\n",
       "                               'concept': 6,\n",
       "                               'age': 12,\n",
       "                               'chip': 5,\n",
       "                               'technology': 8,\n",
       "                               'gallium': 1,\n",
       "                               'arsenide': 1,\n",
       "                               'handling': 5,\n",
       "                               'equipment': 10,\n",
       "                               'addition': 23,\n",
       "                               'C-90': 1,\n",
       "                               'competitor': 3,\n",
       "                               'range': 6,\n",
       "                               'distribution': 5,\n",
       "                               'marketplace': 5,\n",
       "                               'book': 7,\n",
       "                               'drain': 2,\n",
       "                               'profit': 54,\n",
       "                               'hand': 8,\n",
       "                               'loss': 32,\n",
       "                               'comment': 11,\n",
       "                               'contractor': 3,\n",
       "                               'arrangement': 3,\n",
       "                               'father': 4,\n",
       "                               'A.': 2,\n",
       "                               'software': 14,\n",
       "                               'hardware': 5,\n",
       "                               'electric-utility': 1,\n",
       "                               'holding': 3,\n",
       "                               'success': 3,\n",
       "                               'diplomacy': 1,\n",
       "                               'list': 10,\n",
       "                               'priority': 4,\n",
       "                               'watch': 4,\n",
       "                               'result': 10,\n",
       "                               'law': 37,\n",
       "                               'protection': 6,\n",
       "                               'property': 5,\n",
       "                               'spring': 8,\n",
       "                               'scrutiny': 3,\n",
       "                               'progress': 6,\n",
       "                               'issue': 54,\n",
       "                               'realization': 2,\n",
       "                               'world': 22,\n",
       "                               'denial': 1,\n",
       "                               'inventiveness': 1,\n",
       "                               'high-technology': 1,\n",
       "                               'task': 3,\n",
       "                               'enforcement': 11,\n",
       "                               'movie': 8,\n",
       "                               'standing': 5,\n",
       "                               'copyright': 3,\n",
       "                               'agreement': 17,\n",
       "                               'trademark': 1,\n",
       "                               'legislation': 22,\n",
       "                               'measure': 10,\n",
       "                               'part': 39,\n",
       "                               'computer': 23,\n",
       "                               'hook': 2,\n",
       "                               'concern': 41,\n",
       "                               'patent': 10,\n",
       "                               'lawyer': 8,\n",
       "                               'threat': 2,\n",
       "                               'retaliation': 1,\n",
       "                               'recognition': 3,\n",
       "                               'videocassette': 2,\n",
       "                               'piracy': 1,\n",
       "                               'disregard': 1,\n",
       "                               'act': 6,\n",
       "                               'investigation': 5,\n",
       "                               'provision': 8,\n",
       "                               'creditor': 2,\n",
       "                               'declaration': 1,\n",
       "                               'action': 27,\n",
       "                               'official': 17,\n",
       "                               'stature': 2,\n",
       "                               'reduction': 8,\n",
       "                               'negotiator': 1,\n",
       "                               'office': 23,\n",
       "                               'principal': 11,\n",
       "                               'centennial': 1,\n",
       "                               'century': 3,\n",
       "                               'history': 11,\n",
       "                               'face': 10,\n",
       "                               'computing': 2,\n",
       "                               'television': 9,\n",
       "                               'advance': 6,\n",
       "                               'garage': 1,\n",
       "                               'product': 21,\n",
       "                               'desktop': 1,\n",
       "                               'home': 17,\n",
       "                               'mainframe': 1,\n",
       "                               'memory': 4,\n",
       "                               'capacity': 14,\n",
       "                               'pioneer': 2,\n",
       "                               'PC': 3,\n",
       "                               'system': 17,\n",
       "                               'billionaire': 1,\n",
       "                               'disk': 3,\n",
       "                               'telephone': 10,\n",
       "                               'leader': 5,\n",
       "                               'Today': 6,\n",
       "                               'affiliate': 4,\n",
       "                               'label': 1,\n",
       "                               'voting': 2,\n",
       "                               'stake': 23,\n",
       "                               'right': 22,\n",
       "                               'Oil': 1,\n",
       "                               'production': 22,\n",
       "                               'launch': 3,\n",
       "                               'venture': 5,\n",
       "                               'Output': 1,\n",
       "                               'Esso': 1,\n",
       "                               'subsidiary': 7,\n",
       "                               'gelatin': 1,\n",
       "                               'program': 127,\n",
       "                               'response': 6,\n",
       "                               'petition': 2,\n",
       "                               'tariff': 2,\n",
       "                               'status': 4,\n",
       "                               'potential': 3,\n",
       "                               'injury': 1,\n",
       "                               'producer': 5,\n",
       "                               'seller': 2,\n",
       "                               'aide': 4,\n",
       "                               'manufacturer': 4,\n",
       "                               'effort': 11,\n",
       "                               'overhead': 1,\n",
       "                               'level': 20,\n",
       "                               'finance': 13,\n",
       "                               'expansion': 6,\n",
       "                               'load': 1,\n",
       "                               'downturn': 5,\n",
       "                               'dividend': 23,\n",
       "                               'high': 3,\n",
       "                               'founder': 5,\n",
       "                               'shareholder': 12,\n",
       "                               'seat': 5,\n",
       "                               'role': 11,\n",
       "                               'organization': 10,\n",
       "                               'restructuring': 17,\n",
       "                               'consulting': 4,\n",
       "                               'career': 5,\n",
       "                               'chemical': 4,\n",
       "                               'mortgage': 5,\n",
       "                               'conference': 12,\n",
       "                               'rest': 6,\n",
       "                               'investment': 56,\n",
       "                               'bank': 38,\n",
       "                               'interbank': 2,\n",
       "                               'prepayment': 2,\n",
       "                               'burden': 2,\n",
       "                               'tenth': 1,\n",
       "                               'oil': 18,\n",
       "                               'judge': 7,\n",
       "                               'steel': 12,\n",
       "                               'aerospace': 7,\n",
       "                               'energy': 8,\n",
       "                               'giant': 1,\n",
       "                               'tender': 4,\n",
       "                               'Montedison': 1,\n",
       "                               'Erbamont': 1,\n",
       "                               'gold': 9,\n",
       "                               'drawing': 2,\n",
       "                               'intensity': 2,\n",
       "                               'intervention': 1,\n",
       "                               'currency': 7,\n",
       "                               'announcement': 10,\n",
       "                               'craze': 3,\n",
       "                               'rash': 1,\n",
       "                               'turf': 1,\n",
       "                               'visit': 5,\n",
       "                               'head': 10,\n",
       "                               'province': 1,\n",
       "                               'Anything': 1,\n",
       "                               'partner': 7,\n",
       "                               'explosion': 2,\n",
       "                               'mania': 1,\n",
       "                               'oblivion': 1,\n",
       "                               'crash': 11,\n",
       "                               'surge': 5,\n",
       "                               'analyst': 27,\n",
       "                               'hoopla': 1,\n",
       "                               'smattering': 1,\n",
       "                               'Country': 1,\n",
       "                               'taste': 1,\n",
       "                               'instance': 7,\n",
       "                               'frenzy': 1,\n",
       "                               'discount': 5,\n",
       "                               'premium': 9,\n",
       "                               'reason': 11,\n",
       "                               'Share': 1,\n",
       "                               'play': 1,\n",
       "                               'integration': 4,\n",
       "                               'exposure': 5,\n",
       "                               'viewpoint': 3,\n",
       "                               'advice': 1,\n",
       "                               'party': 5,\n",
       "                               'repayment': 1,\n",
       "                               'branch': 7,\n",
       "                               'credit': 21,\n",
       "                               'default': 4,\n",
       "                               'key': 2,\n",
       "                               'reflection': 3,\n",
       "                               'survey': 17,\n",
       "                               'manufacturing': 14,\n",
       "                               'index': 64,\n",
       "                               'reading': 10,\n",
       "                               'sector': 17,\n",
       "                               'defense': 12,\n",
       "                               'report': 31,\n",
       "                               'building': 9,\n",
       "                               'activity': 16,\n",
       "                               'inflation': 6,\n",
       "                               'economist': 6,\n",
       "                               'slack': 1,\n",
       "                               'blank': 1,\n",
       "                               'Factory': 3,\n",
       "                               'recession': 11,\n",
       "                               'lack': 6,\n",
       "                               'warning': 3,\n",
       "                               'buildup': 1,\n",
       "                               'front': 5,\n",
       "                               'landing': 2,\n",
       "                               'slowdown': 4,\n",
       "                               'strength': 7,\n",
       "                               'half': 9,\n",
       "                               'Spending': 1,\n",
       "                               'goverment': 1,\n",
       "                               'renovation': 2,\n",
       "                               'purchasing': 5,\n",
       "                               'association': 9,\n",
       "                               'committee': 13,\n",
       "                               'evidence': 13,\n",
       "                               'export': 11,\n",
       "                               'purhasing': 1,\n",
       "                               'delivery': 16,\n",
       "                               'difference': 10,\n",
       "                               'improvement': 6,\n",
       "                               'worsening': 1,\n",
       "                               'trend': 7,\n",
       "                               'supply': 6,\n",
       "                               'dozen': 4,\n",
       "                               'newcomer': 1,\n",
       "                               'milk': 4,\n",
       "                               'powder': 1,\n",
       "                               'thing': 14,\n",
       "                               'row': 2,\n",
       "                               'shortage': 2,\n",
       "                               'dairy': 1,\n",
       "                               'import': 5,\n",
       "                               'article': 6,\n",
       "                               'baby': 1,\n",
       "                               'lot': 12,\n",
       "                               'common': 3,\n",
       "                               'novel': 4,\n",
       "                               'texture': 1,\n",
       "                               'reader': 3,\n",
       "                               'charm': 1,\n",
       "                               'society': 3,\n",
       "                               'lore': 1,\n",
       "                               'author': 4,\n",
       "                               'school': 22,\n",
       "                               'notion': 2,\n",
       "                               'Japanese': 2,\n",
       "                               'plot': 1,\n",
       "                               'reality': 4,\n",
       "                               'hero': 2,\n",
       "                               'snow': 1,\n",
       "                               'search': 1,\n",
       "                               'sheep': 1,\n",
       "                               'star': 2,\n",
       "                               'back': 2,\n",
       "                               'behest': 1,\n",
       "                               'mobster': 1,\n",
       "                               'degree': 2,\n",
       "                               'tow': 1,\n",
       "                               'girlfriend': 1,\n",
       "                               'anything': 12,\n",
       "                               'butterfly': 1,\n",
       "                               'chauffeur': 1,\n",
       "                               'phone': 2,\n",
       "                               'figure': 4,\n",
       "                               'sheepskin': 1,\n",
       "                               'publishing': 9,\n",
       "                               'sensation': 1,\n",
       "                               'brat': 1,\n",
       "                               'pack': 1,\n",
       "                               'best-seller': 1,\n",
       "                               'language': 6,\n",
       "                               'baseball': 3,\n",
       "                               'version': 5,\n",
       "                               'game': 8,\n",
       "                               'mirror': 1,\n",
       "                               'harmony': 2,\n",
       "                               'spirit': 4,\n",
       "                               'player': 1,\n",
       "                               'commitment': 3,\n",
       "                               'practice': 10,\n",
       "                               'image': 3,\n",
       "                               'batting': 1,\n",
       "                               'average': 10,\n",
       "                               'soul': 1,\n",
       "                               'symbol': 2,\n",
       "                               'ball': 1,\n",
       "                               'bat': 1,\n",
       "                               'stadium': 7,\n",
       "                               'strike': 11,\n",
       "                               'zone': 2,\n",
       "                               'size': 10,\n",
       "                               'hitter': 1,\n",
       "                               'shame': 3,\n",
       "                               'defeat': 1,\n",
       "                               'conduct': 1,\n",
       "                               'road': 4,\n",
       "                               'chronicle': 1,\n",
       "                               'plate': 2,\n",
       "                               'complaint': 3,\n",
       "                               'American': 1,\n",
       "                               'regret': 2,\n",
       "                               'lunch': 1,\n",
       "                               'dormitory': 1,\n",
       "                               'caretaker': 1,\n",
       "                               'style': 3,\n",
       "                               'mark': 8,\n",
       "                               'overtime': 1,\n",
       "                               'sake': 1,\n",
       "                               'solidarity': 1,\n",
       "                               'employee': 7,\n",
       "                               'responsibility': 4,\n",
       "                               'science': 1,\n",
       "                               'lesson': 4,\n",
       "                               'crime': 5,\n",
       "                               'appointment': 4,\n",
       "                               'something': 13,\n",
       "                               'deputy': 5,\n",
       "                               'editorial': 6,\n",
       "                               'globe': 3,\n",
       "                               'tobacco': 1,\n",
       "                               'smoke': 1,\n",
       "                               'fine': 24,\n",
       "                               'smoking': 4,\n",
       "                               'fast-food': 5,\n",
       "                               'minister': 4,\n",
       "                               'study': 10,\n",
       "                               'agency': 17,\n",
       "                               'colony': 1,\n",
       "                               'deal': 18,\n",
       "                               'stress': 1,\n",
       "                               'cabinet': 1,\n",
       "                               'proposal': 21,\n",
       "                               'center': 6,\n",
       "                               'membership': 6,\n",
       "                               'application': 5,\n",
       "                               'assistant': 4,\n",
       "                               'mainland': 1,\n",
       "                               'Chinese': 1,\n",
       "                               'sex': 2,\n",
       "                               'man': 12,\n",
       "                               'disease': 4,\n",
       "                               'hospital': 1,\n",
       "                               'family': 21,\n",
       "                               'newspaper': 13,\n",
       "                               'life': 14,\n",
       "                               'gas': 4,\n",
       "                               'line': 13,\n",
       "                               'rise': 9,\n",
       "                               'coal': 2,\n",
       "                               'victory': 2,\n",
       "                               'parliament': 3,\n",
       "                               'dam': 5,\n",
       "                               'damage': 3,\n",
       "                               'twin': 1,\n",
       "                               'twindam': 1,\n",
       "                               'peak': 2,\n",
       "                               'painting': 1,\n",
       "                               'playwright': 1,\n",
       "                               'upturn': 1,\n",
       "                               'bond': 26,\n",
       "                               'estate': 6,\n",
       "                               'warrant': 2,\n",
       "                               'holder': 2,\n",
       "                               'par': 8,\n",
       "                               'date': 6,\n",
       "                               'actor': 1,\n",
       "                               'inheritor': 1,\n",
       "                               'claim': 2,\n",
       "                               'writer': 4,\n",
       "                               'film': 7,\n",
       "                               'student': 10,\n",
       "                               'campus': 1,\n",
       "                               'sketch': 2,\n",
       "                               'artist': 2,\n",
       "                               'piece': 2,\n",
       "                               'tramp': 1,\n",
       "                               'dialogue': 2,\n",
       "                               'person': 13,\n",
       "                               'Composer': 1,\n",
       "                               'college': 3,\n",
       "                               'friend': 4,\n",
       "                               'living': 1,\n",
       "                               'bass': 1,\n",
       "                               'music': 2,\n",
       "                               'score': 2,\n",
       "                               'view': 10,\n",
       "                               'black': 1,\n",
       "                               'white': 1,\n",
       "                               'purpose': 7,\n",
       "                               'strip': 1,\n",
       "                               'crack': 1,\n",
       "                               'cardboard': 2,\n",
       "                               'box': 4,\n",
       "                               'routine': 1,\n",
       "                               'night': 8,\n",
       "                               'girl': 2,\n",
       "                               'charge': 25,\n",
       "                               'waif': 1,\n",
       "                               'mother': 3,\n",
       "                               'child': 3,\n",
       "                               'blessing': 2,\n",
       "                               'curse': 1,\n",
       "                               'sense': 7,\n",
       "                               'inadequacy': 1,\n",
       "                               'romance': 2,\n",
       "                               'woman': 9,\n",
       "                               'shop': 1,\n",
       "                               'apartment': 2,\n",
       "                               'camera': 1,\n",
       "                               'vagabond': 1,\n",
       "                               'existence': 1,\n",
       "                               'sound': 5,\n",
       "                               'street': 4,\n",
       "                               'achievement': 4,\n",
       "                               'picture': 5,\n",
       "                               'character': 2,\n",
       "                               'angle': 2,\n",
       "                               'significance': 1,\n",
       "                               'hypocrisy': 1,\n",
       "                               'traitor': 1,\n",
       "                               'abortionist': 2,\n",
       "                               'jam': 1,\n",
       "                               'cocoa': 1,\n",
       "                               'job': 18,\n",
       "                               'client': 8,\n",
       "                               'remorse': 1,\n",
       "                               'husband': 3,\n",
       "                               'lover': 1,\n",
       "                               'rendering': 1,\n",
       "                               'spot': 3,\n",
       "                               'portrayal': 1,\n",
       "                               'look': 5,\n",
       "                               'twin-jet': 1,\n",
       "                               'aircraft': 2,\n",
       "                               'press': 8,\n",
       "                               'contribution': 1,\n",
       "                               'plane': 1,\n",
       "                               'event': 3,\n",
       "                               'irony': 1,\n",
       "                               'attack': 4,\n",
       "                               'commercial': 6,\n",
       "                               'boost': 3,\n",
       "                               'campaign': 15,\n",
       "                               'election': 2,\n",
       "                               'hostility': 1,\n",
       "                               'mudslinging': 1,\n",
       "                               'era': 3,\n",
       "                               'content': 1,\n",
       "                               'dawn': 1,\n",
       "                               'art': 4,\n",
       "                               'stage': 2,\n",
       "                               'consultant': 3,\n",
       "                               'TV': 10,\n",
       "                               'tone': 2,\n",
       "                               'screen': 4,\n",
       "                               'shot': 2,\n",
       "                               'candidate': 2,\n",
       "                               'mayor': 5,\n",
       "                               'income': 42,\n",
       "                               'male': 2,\n",
       "                               'voice': 8,\n",
       "                               'master': 4,\n",
       "                               'insurance': 18,\n",
       "                               'kidnapper': 1,\n",
       "                               'kicker': 2,\n",
       "                               'corruption': 2,\n",
       "                               'One': 2,\n",
       "                               'truth': 2,\n",
       "                               'Everybody': 1,\n",
       "                               'nobody': 2,\n",
       "                               'situation': 13,\n",
       "                               'oversight': 1,\n",
       "                               'secret': 1,\n",
       "                               'reporting': 2,\n",
       "                               'kidnapping': 1,\n",
       "                               'side': 9,\n",
       "                               'battle': 9,\n",
       "                               'abortion': 13,\n",
       "                               'persuasion': 1,\n",
       "                               'tour': 1,\n",
       "                               'flag': 3,\n",
       "                               'tradition': 2,\n",
       "                               'freedom': 3,\n",
       "                               'liberty': 1,\n",
       "                               'statue': 1,\n",
       "                               'rape': 5,\n",
       "                               'incest': 1,\n",
       "                               'referendum': 2,\n",
       "                               'attorney': 6,\n",
       "                               'general': 2,\n",
       "                               'series': 12,\n",
       "                               'support': 12,\n",
       "                               'counterattack': 1,\n",
       "                               'close-up': 1,\n",
       "                               'courtroom': 2,\n",
       "                               'ordeal': 1,\n",
       "                               'bill': 33,\n",
       "                               'constituent': 1,\n",
       "                               'technique': 1,\n",
       "                               'interrogation': 1,\n",
       "                               'stigma': 1,\n",
       "                               'campaigner': 1,\n",
       "                               'scientist': 2,\n",
       "                               'onus': 1,\n",
       "                               'campaigning': 2,\n",
       "                               'remainder': 3,\n",
       "                               'season': 3,\n",
       "                               'truce': 3,\n",
       "                               'sensitivity': 1,\n",
       "                               'photograph': 1,\n",
       "                               'rival': 4,\n",
       "                               'focus': 4,\n",
       "                               'waste': 3,\n",
       "                               'fraud': 2,\n",
       "                               'nose': 3,\n",
       "                               'barrel': 3,\n",
       "                               'land': 3,\n",
       "                               'heating': 6,\n",
       "                               'pollution': 1,\n",
       "                               'environment': 7,\n",
       "                               'credibility': 2,\n",
       "                               'route': 1,\n",
       "                               're-election': 2,\n",
       "                               'rout': 1,\n",
       "                               'exchange': 19,\n",
       "                               'region': 16,\n",
       "                               'cooperation': 3,\n",
       "                               'domination': 2,\n",
       "                               'policy': 15,\n",
       "                               'flow': 5,\n",
       "                               'motion': 4,\n",
       "                               'assistance': 7,\n",
       "                               'lead': 6,\n",
       "                               'influence': 5,\n",
       "                               'hegemony': 1,\n",
       "                               'budget': 15,\n",
       "                               'ground': 4,\n",
       "                               'decade': 7,\n",
       "                               'behemoth': 1,\n",
       "                               'evolution': 2,\n",
       "                               'past': 8,\n",
       "                               'aid': 13,\n",
       "                               'donor': 2,\n",
       "                               'lender': 1,\n",
       "                               'approach': 6,\n",
       "                               'specialist': 7,\n",
       "                               'effect': 18,\n",
       "                               'Asia': 1,\n",
       "                               'framework': 1,\n",
       "                               'transportation': 4,\n",
       "                               'telecommunications': 1,\n",
       "                               'rim': 1,\n",
       "                               'speech': 4,\n",
       "                               'intention': 3,\n",
       "                               'shape': 3,\n",
       "                               'architecture': 3,\n",
       "                               'dominance': 1,\n",
       "                               'optimism': 3,\n",
       "                               'undertone': 1,\n",
       "                               'caution': 2,\n",
       "                               'understanding': 3,\n",
       "                               'commerce': 2,\n",
       "                               'attitude': 2,\n",
       "                               'gain': 15,\n",
       "                               'everyone': 2,\n",
       "                               'security': 7,\n",
       "                               'uncertainty': 6,\n",
       "                               'troop': 1,\n",
       "                               'counterweight': 1,\n",
       "                               'juggernaut': 1,\n",
       "                               'Test': 3,\n",
       "                               'cheating': 9,\n",
       "                               'stockbroker': 1,\n",
       "                               'profession': 1,\n",
       "                               'word': 4,\n",
       "                               'social-studies': 2,\n",
       "                               'section': 6,\n",
       "                               'test': 34,\n",
       "                               'protest': 2,\n",
       "                               'teacher': 13,\n",
       "                               'examination': 5,\n",
       "                               'geography': 5,\n",
       "                               'projector': 1,\n",
       "                               'alternative': 5,\n",
       "                               'jail': 3,\n",
       "                               'downfall': 1,\n",
       "                               'wake': 5,\n",
       "                               'bitterness': 1,\n",
       "                               'anger': 1,\n",
       "                               'betrayer': 1,\n",
       "                               'school-district': 1,\n",
       "                               'nature': 5,\n",
       "                               'martyr': 1,\n",
       "                               'light': 4,\n",
       "                               'reform': 7,\n",
       "                               'testing': 10,\n",
       "                               'temptation': 2,\n",
       "                               'statute': 3,\n",
       "                               'bonus': 6,\n",
       "                               'ability': 12,\n",
       "                               'pressure': 17,\n",
       "                               'education': 6,\n",
       "                               'wrongdoing': 7,\n",
       "                               'Evidence': 1,\n",
       "                               'adult': 2,\n",
       "                               'help': 4,\n",
       "                               'classroom': 7,\n",
       "                               'instruction': 2,\n",
       "                               'nothing': 9,\n",
       "                               'crib': 2,\n",
       "                               'Use': 1,\n",
       "                               'district': 11,\n",
       "                               'lab': 1,\n",
       "                               'superintendent': 1,\n",
       "                               'entrance': 1,\n",
       "                               'foundation': 1,\n",
       "                               'abuse': 5,\n",
       "                               'track': 1,\n",
       "                               'achievement-test': 1,\n",
       "                               'preparation': 4,\n",
       "                               'hill': 1,\n",
       "                               'textile': 3,\n",
       "                               'physicist': 2,\n",
       "                               'actress': 1,\n",
       "                               '1980s': 1,\n",
       "                               'glory': 1,\n",
       "                               'facade': 1,\n",
       "                               'violence': 2,\n",
       "                               'Crime': 1,\n",
       "                               'enrollment': 1,\n",
       "                               'predecessor': 2,\n",
       "                               'breakdown': 1,\n",
       "                               'term': 12,\n",
       "                               'death': 6,\n",
       "                               'trouble': 5,\n",
       "                               'elite': 1,\n",
       "                               'deadwood': 1,\n",
       "                               'faculty': 2,\n",
       "                               'safety': 23,\n",
       "                               'behalf': 2,\n",
       "                               'funding': 18,\n",
       "                               'betterment': 1,\n",
       "                               'dismissal': 1,\n",
       "                               'staff': 9,\n",
       "                               'curriculum': 3,\n",
       "                               'pay': 8,\n",
       "                               'cadet': 2,\n",
       "                               'creation': 3,\n",
       "                               'teaching': 4,\n",
       "                               'grant': 1,\n",
       "                               'pep': 1,\n",
       "                               'club': 3,\n",
       "                               'Literacy': 1,\n",
       "                               'Civilization': 2,\n",
       "                               'Teacher': 1,\n",
       "                               'Year': 2,\n",
       "                               'lady': 2,\n",
       "                               'freshman': 1,\n",
       "                               'grader': 1,\n",
       "                               'senior': 2,\n",
       "                               'college-bowl': 1,\n",
       "                               'furniture': 2,\n",
       "                               'homework': 1,\n",
       "                               'football': 2,\n",
       "                               'grandstander': 1,\n",
       "                               'hearing': 7,\n",
       "                               'incentive-bonus': 1,\n",
       "                               'source': 6,\n",
       "                               'salary': 5,\n",
       "                               'pride': 1,\n",
       "                               'seminar': 2,\n",
       "                               'mistake': 2,\n",
       "                               'sociology': 1,\n",
       "                               'bottom': 4,\n",
       "                               'self-esteem': 1,\n",
       "                               ...}),\n",
       "                     'NNP': FreqDist({'Pierre': 1,\n",
       "                               'Vinken': 2,\n",
       "                               'Nov.': 23,\n",
       "                               'Mr.': 375,\n",
       "                               'Elsevier': 1,\n",
       "                               'N.V.': 3,\n",
       "                               'Dutch': 1,\n",
       "                               'Rudolph': 3,\n",
       "                               'Agnew': 1,\n",
       "                               'Consolidated': 2,\n",
       "                               'Gold': 2,\n",
       "                               'Fields': 2,\n",
       "                               'PLC': 13,\n",
       "                               'Kent': 8,\n",
       "                               'Lorillard': 4,\n",
       "                               'Inc.': 97,\n",
       "                               'Loews': 1,\n",
       "                               'Corp.': 117,\n",
       "                               'New': 159,\n",
       "                               'England': 23,\n",
       "                               'Journal': 10,\n",
       "                               'Medicine': 5,\n",
       "                               'James': 22,\n",
       "                               'A.': 16,\n",
       "                               'Talcott': 4,\n",
       "                               'Boston': 17,\n",
       "                               'Dana-Farber': 1,\n",
       "                               'Cancer': 2,\n",
       "                               'Institute': 15,\n",
       "                               'Dr.': 13,\n",
       "                               'National': 20,\n",
       "                               'Harvard': 3,\n",
       "                               'University': 22,\n",
       "                               'West': 10,\n",
       "                               'Groton': 1,\n",
       "                               'Mass.': 8,\n",
       "                               'Hollingsworth': 2,\n",
       "                               'Vose': 2,\n",
       "                               'Co.': 74,\n",
       "                               'U.S.': 220,\n",
       "                               'Brooke': 1,\n",
       "                               'T.': 11,\n",
       "                               'Mossman': 2,\n",
       "                               'Vermont': 1,\n",
       "                               'College': 6,\n",
       "                               'July': 8,\n",
       "                               'Environmental': 1,\n",
       "                               'Protection': 1,\n",
       "                               'Agency': 5,\n",
       "                               'Darrell': 1,\n",
       "                               'Phillips': 2,\n",
       "                               'IBC': 1,\n",
       "                               'Money': 3,\n",
       "                               'Fund': 12,\n",
       "                               'Report': 8,\n",
       "                               'Tuesday': 46,\n",
       "                               'August': 18,\n",
       "                               'Donoghue': 1,\n",
       "                               'Brenda': 1,\n",
       "                               'Malizia': 1,\n",
       "                               'Negus': 1,\n",
       "                               'Treasury': 41,\n",
       "                               'Monday': 12,\n",
       "                               'Dreyfus': 1,\n",
       "                               'World-Wide': 1,\n",
       "                               'Dollar': 1,\n",
       "                               'J.P.': 1,\n",
       "                               'Bolduc': 1,\n",
       "                               'W.R.': 3,\n",
       "                               'Grace': 4,\n",
       "                               'Terrence': 1,\n",
       "                               'D.': 15,\n",
       "                               'Daniels': 1,\n",
       "                               'Energy': 6,\n",
       "                               'Pacific': 10,\n",
       "                               'First': 35,\n",
       "                               'Financial': 14,\n",
       "                               'Royal': 1,\n",
       "                               'Trustco': 1,\n",
       "                               'Ltd.': 19,\n",
       "                               'Toronto': 5,\n",
       "                               'McDermott': 1,\n",
       "                               'International': 33,\n",
       "                               'Babcock': 1,\n",
       "                               'Wilcox': 1,\n",
       "                               'Bailey': 3,\n",
       "                               'Controls': 2,\n",
       "                               'Operations': 1,\n",
       "                               'Finmeccanica': 2,\n",
       "                               'S.p': 1,\n",
       "                               'Wickliffe': 1,\n",
       "                               'Ohio': 9,\n",
       "                               'Congress': 46,\n",
       "                               'House': 55,\n",
       "                               'Senate': 18,\n",
       "                               'Clark': 1,\n",
       "                               'J.': 15,\n",
       "                               'Vitulli': 2,\n",
       "                               'Mazda': 2,\n",
       "                               'Motor': 7,\n",
       "                               'Corp': 11,\n",
       "                               'Chrysler': 6,\n",
       "                               'Boca': 3,\n",
       "                               'Raton': 2,\n",
       "                               'Hot': 1,\n",
       "                               'Springs': 2,\n",
       "                               'Association': 21,\n",
       "                               'Manufacturers': 1,\n",
       "                               'Hoosier': 1,\n",
       "                               'Indianapolis': 4,\n",
       "                               'Rust': 1,\n",
       "                               'Belt': 3,\n",
       "                               'Du': 2,\n",
       "                               'Pont': 2,\n",
       "                               'Maytag': 1,\n",
       "                               'Trojan': 1,\n",
       "                               'Steel': 5,\n",
       "                               'Valley': 12,\n",
       "                               'Queen': 1,\n",
       "                               'Cheese': 1,\n",
       "                               'Factory': 1,\n",
       "                               'Mayor': 2,\n",
       "                               'William': 23,\n",
       "                               'H.': 4,\n",
       "                               'Hudnut': 1,\n",
       "                               'III': 3,\n",
       "                               'Symphony': 1,\n",
       "                               'Orchestra': 1,\n",
       "                               'Victor': 2,\n",
       "                               'Borge': 1,\n",
       "                               'Speedway': 1,\n",
       "                               'Fortune': 1,\n",
       "                               'Indiana': 5,\n",
       "                               'Roof': 1,\n",
       "                               'February': 3,\n",
       "                               'South': 39,\n",
       "                               'Korea': 19,\n",
       "                               'October': 61,\n",
       "                               'Wednesday': 16,\n",
       "                               'Trade': 14,\n",
       "                               'Industry': 4,\n",
       "                               'Ministry': 10,\n",
       "                               'January': 12,\n",
       "                               'Newsweek': 10,\n",
       "                               'Time': 8,\n",
       "                               'Washington': 23,\n",
       "                               'Post': 1,\n",
       "                               'Warner': 3,\n",
       "                               'Mortimer': 1,\n",
       "                               'B.': 7,\n",
       "                               'Zuckerman': 1,\n",
       "                               'News': 6,\n",
       "                               'World': 13,\n",
       "                               'Alan': 3,\n",
       "                               'Spoon': 3,\n",
       "                               'mid-October': 1,\n",
       "                               'Circulation': 1,\n",
       "                               'Credit': 2,\n",
       "                               'Plan': 2,\n",
       "                               'Publishers': 1,\n",
       "                               'Information': 3,\n",
       "                               'Bureau': 2,\n",
       "                               'Audit': 1,\n",
       "                               'Circulations': 1,\n",
       "                               'Electric': 7,\n",
       "                               'System': 4,\n",
       "                               'Public': 4,\n",
       "                               'Service': 10,\n",
       "                               'Hampshire': 8,\n",
       "                               'United': 19,\n",
       "                               'Illuminating': 3,\n",
       "                               'Northeast': 7,\n",
       "                               'Utilities': 2,\n",
       "                               'PS': 7,\n",
       "                               'Westborough': 1,\n",
       "                               'Haven': 2,\n",
       "                               'Conn.': 7,\n",
       "                               'Hartford': 3,\n",
       "                               'Conn': 2,\n",
       "                               'Manchester': 1,\n",
       "                               'N.H.': 1,\n",
       "                               'John': 34,\n",
       "                               'Rowe': 5,\n",
       "                               'Wilbur': 1,\n",
       "                               'Ross': 5,\n",
       "                               'Jr.': 12,\n",
       "                               'Rothschild': 1,\n",
       "                               'Federal': 20,\n",
       "                               'Regulatory': 1,\n",
       "                               'Commission': 16,\n",
       "                               'FERC': 1,\n",
       "                               'York': 107,\n",
       "                               'Stock': 33,\n",
       "                               'Exchange': 50,\n",
       "                               'Norman': 2,\n",
       "                               'Ricken': 1,\n",
       "                               'R': 1,\n",
       "                               'Us': 1,\n",
       "                               'Frederick': 2,\n",
       "                               'Deane': 1,\n",
       "                               'Signet': 1,\n",
       "                               'Banking': 3,\n",
       "                               'Daniel': 2,\n",
       "                               'M.': 9,\n",
       "                               'Rexinger': 1,\n",
       "                               'Circuit': 2,\n",
       "                               'City': 16,\n",
       "                               'Robert': 24,\n",
       "                               'R.': 16,\n",
       "                               'Glauber': 1,\n",
       "                               'Commonwealth': 14,\n",
       "                               'Edison': 21,\n",
       "                               'Illinois': 4,\n",
       "                               'Commerce': 17,\n",
       "                               'Judge': 15,\n",
       "                               'Richard': 13,\n",
       "                               'Curry': 8,\n",
       "                               'April': 13,\n",
       "                               'Feb.': 2,\n",
       "                               'Dec.': 16,\n",
       "                               'Byron': 2,\n",
       "                               'Rockford': 2,\n",
       "                               'Ill.': 7,\n",
       "                               'Supreme': 9,\n",
       "                               'Court': 12,\n",
       "                               'Appellate': 1,\n",
       "                               'Braidwood': 3,\n",
       "                               'LaSalle': 1,\n",
       "                               'I': 2,\n",
       "                               'Japan': 75,\n",
       "                               'Automobile': 1,\n",
       "                               'September': 42,\n",
       "                               'March': 18,\n",
       "                               'Texas': 16,\n",
       "                               'Chinchon': 1,\n",
       "                               'Seoul': 4,\n",
       "                               'Cray': 36,\n",
       "                               'Computer': 13,\n",
       "                               'Seymour': 5,\n",
       "                               'Research': 21,\n",
       "                               'Cray-3': 8,\n",
       "                               'May': 12,\n",
       "                               'Gregory': 2,\n",
       "                               'Barnum': 3,\n",
       "                               'Gary': 4,\n",
       "                               'P.': 5,\n",
       "                               'Smaby': 2,\n",
       "                               'Group': 26,\n",
       "                               'Minneapolis': 5,\n",
       "                               'SEC': 6,\n",
       "                               'Business': 9,\n",
       "                               'Hitachi': 1,\n",
       "                               'NEC': 7,\n",
       "                               'Fujitsu': 13,\n",
       "                               'Ltd': 6,\n",
       "                               'Nasdaq': 6,\n",
       "                               'Colorado': 2,\n",
       "                               'Colo.': 5,\n",
       "                               'Messrs.': 1,\n",
       "                               'Neil': 2,\n",
       "                               'Davenport': 1,\n",
       "                               'Joseph': 3,\n",
       "                               'Blanchard': 1,\n",
       "                               'Malcolm': 2,\n",
       "                               'Hammerton': 1,\n",
       "                               'Douglas': 5,\n",
       "                               'Wheeland': 1,\n",
       "                               'Stevens': 2,\n",
       "                               'Donald': 6,\n",
       "                               'Pardus': 1,\n",
       "                               'Arthur': 3,\n",
       "                               'Hatch': 2,\n",
       "                               'Eastern': 5,\n",
       "                               'Carney': 1,\n",
       "                               'Tassinari': 1,\n",
       "                               'Taiwan': 8,\n",
       "                               'Saudi': 4,\n",
       "                               'Arabia': 3,\n",
       "                               'China': 25,\n",
       "                               'Thailand': 5,\n",
       "                               'India': 1,\n",
       "                               'Brazil': 9,\n",
       "                               'Mexico': 6,\n",
       "                               'Representative': 3,\n",
       "                               'Carla': 3,\n",
       "                               'Hills': 15,\n",
       "                               'Mrs.': 58,\n",
       "                               'Taipei': 3,\n",
       "                               'Italy': 3,\n",
       "                               'Canada': 7,\n",
       "                               'Greece': 1,\n",
       "                               'Spain': 4,\n",
       "                               'Hoffman': 1,\n",
       "                               'Turkey': 2,\n",
       "                               'Malaysia': 6,\n",
       "                               'Argentina': 2,\n",
       "                               'Economy': 1,\n",
       "                               'Minister': 4,\n",
       "                               'Nestor': 1,\n",
       "                               'Rapanelli': 4,\n",
       "                               'Latin': 1,\n",
       "                               'American': 38,\n",
       "                               'Miguel': 1,\n",
       "                               'Alurralde': 1,\n",
       "                               'Assistant': 1,\n",
       "                               'Secretary': 6,\n",
       "                               'David': 14,\n",
       "                               'Mulford': 1,\n",
       "                               'Carlos': 3,\n",
       "                               'Carballo': 1,\n",
       "                               'President': 28,\n",
       "                               'Menem': 1,\n",
       "                               'The': 4,\n",
       "                               'Wall': 37,\n",
       "                               'Street': 38,\n",
       "                               'Apple': 5,\n",
       "                               'II': 22,\n",
       "                               'Commodore': 1,\n",
       "                               'Pet': 1,\n",
       "                               'Tandy': 1,\n",
       "                               'TRS-80': 1,\n",
       "                               'Stephen': 6,\n",
       "                               'Wozniak': 1,\n",
       "                               'Steven': 2,\n",
       "                               'Jobs': 1,\n",
       "                               'Homebrew': 1,\n",
       "                               'Club': 1,\n",
       "                               'Altair': 1,\n",
       "                               'Sol': 1,\n",
       "                               'IMSAI': 1,\n",
       "                               'Gates': 2,\n",
       "                               'Paul': 5,\n",
       "                               'Allen': 3,\n",
       "                               'IBM': 6,\n",
       "                               'F.': 4,\n",
       "                               'Shugart': 1,\n",
       "                               'Seagate': 1,\n",
       "                               'Technology': 3,\n",
       "                               'Dennis': 2,\n",
       "                               'Hayes': 1,\n",
       "                               'Dale': 1,\n",
       "                               'Heatherington': 1,\n",
       "                               'Atlanta': 6,\n",
       "                               'F.H.': 1,\n",
       "                               'Faulding': 3,\n",
       "                               'Moleculon': 3,\n",
       "                               'Kalipharma': 2,\n",
       "                               'Purepac': 1,\n",
       "                               'Australia': 5,\n",
       "                               'Bass': 2,\n",
       "                               'Strait': 1,\n",
       "                               'Whiting': 4,\n",
       "                               'Esso': 2,\n",
       "                               'Exxon': 2,\n",
       "                               'Broken': 1,\n",
       "                               'Hill': 3,\n",
       "                               'Pty.': 1,\n",
       "                               'Perch': 1,\n",
       "                               'Dolphin': 1,\n",
       "                               'Seahorse': 1,\n",
       "                               'Tarwhine': 1,\n",
       "                               'R.P.': 2,\n",
       "                               'Scherer': 2,\n",
       "                               'Southern': 6,\n",
       "                               'Optical': 2,\n",
       "                               'Thomas': 14,\n",
       "                               'Sloan': 1,\n",
       "                               'Shearson': 16,\n",
       "                               'Lehman': 6,\n",
       "                               'Hutton': 6,\n",
       "                               'White': 17,\n",
       "                               'Bush': 44,\n",
       "                               'Virgin': 2,\n",
       "                               'Timex': 3,\n",
       "                               'Generalized': 1,\n",
       "                               'Philippines': 3,\n",
       "                               'Magna': 8,\n",
       "                               'McAlpine': 8,\n",
       "                               'Frank': 4,\n",
       "                               'Stronach': 5,\n",
       "                               'Akerfeldt': 1,\n",
       "                               'Class': 2,\n",
       "                               'A': 2,\n",
       "                               'Parliament': 3,\n",
       "                               'Manfred': 1,\n",
       "                               'Gingl': 1,\n",
       "                               'Lord': 2,\n",
       "                               'Chilver': 1,\n",
       "                               'English': 3,\n",
       "                               'Clays': 1,\n",
       "                               'Mortgage': 2,\n",
       "                               'Fannie': 4,\n",
       "                               'Mae': 6,\n",
       "                               'O.': 1,\n",
       "                               'Maxwell': 4,\n",
       "                               'France': 9,\n",
       "                               'Hong': 7,\n",
       "                               'Kong': 7,\n",
       "                               'Blackstone': 1,\n",
       "                               'Goldman': 7,\n",
       "                               'Sachs': 7,\n",
       "                               'Daiwa': 2,\n",
       "                               'Co': 16,\n",
       "                               'London': 26,\n",
       "                               'L.': 7,\n",
       "                               'Pate': 1,\n",
       "                               'LTV': 1,\n",
       "                               'Bankruptcy': 2,\n",
       "                               'Code': 2,\n",
       "                               'Montedison': 2,\n",
       "                               'S.p.A.': 1,\n",
       "                               'Acquisition': 6,\n",
       "                               'Erbamont': 1,\n",
       "                               'November': 9,\n",
       "                               'Finance': 9,\n",
       "                               'Bank': 32,\n",
       "                               'June': 14,\n",
       "                               'Charles': 10,\n",
       "                               'E.': 8,\n",
       "                               'Simon': 2,\n",
       "                               'Chile': 2,\n",
       "                               'Austria': 1,\n",
       "                               'Portugal': 1,\n",
       "                               'Philippine': 1,\n",
       "                               'Corazon': 1,\n",
       "                               'Aquino': 1,\n",
       "                               'the': 1,\n",
       "                               'Big': 33,\n",
       "                               'Board': 43,\n",
       "                               'Guinea': 3,\n",
       "                               'George': 5,\n",
       "                               'Foot': 3,\n",
       "                               'Newgate': 2,\n",
       "                               'Management': 12,\n",
       "                               'Associates': 1,\n",
       "                               'Northampton': 1,\n",
       "                               'Mass': 3,\n",
       "                               'Michael': 17,\n",
       "                               'Porter': 4,\n",
       "                               'Smith': 6,\n",
       "                               'Barney': 3,\n",
       "                               'Harris': 2,\n",
       "                               'Upham': 2,\n",
       "                               'Oct.': 25,\n",
       "                               'Asia': 14,\n",
       "                               'Europe': 10,\n",
       "                               'Soviet': 9,\n",
       "                               'Union': 21,\n",
       "                               'Moscow': 7,\n",
       "                               'State': 13,\n",
       "                               'Department': 42,\n",
       "                               'Foreign': 5,\n",
       "                               'Economic': 3,\n",
       "                               'Affairs': 2,\n",
       "                               'Kerensky': 1,\n",
       "                               'Johnson': 14,\n",
       "                               'Debt': 1,\n",
       "                               'Default': 1,\n",
       "                               'Act': 7,\n",
       "                               'Monetary': 2,\n",
       "                               'U.S.S.R.': 1,\n",
       "                               'War': 4,\n",
       "                               'Purchasing': 4,\n",
       "                               'Kenneth': 2,\n",
       "                               'Mayland': 1,\n",
       "                               'Society': 4,\n",
       "                               'Cleveland': 6,\n",
       "                               'Reserve': 7,\n",
       "                               'Elliott': 1,\n",
       "                               'Platt': 2,\n",
       "                               'Donaldson': 4,\n",
       "                               'Lufkin': 4,\n",
       "                               'Jenrette': 4,\n",
       "                               'Securities': 10,\n",
       "                               'Berson': 1,\n",
       "                               'Bankers': 3,\n",
       "                               'Government': 2,\n",
       "                               'McGraw-Hill': 6,\n",
       "                               'F.W.': 1,\n",
       "                               'Dodge': 4,\n",
       "                               'Bretz': 3,\n",
       "                               'Pitney': 1,\n",
       "                               'Bowes': 1,\n",
       "                               'Stamford': 3,\n",
       "                               'Pamela': 2,\n",
       "                               'Sebastian': 1,\n",
       "                               'Haruki': 1,\n",
       "                               'Murakami': 2,\n",
       "                               'Wild': 3,\n",
       "                               'Sheep': 4,\n",
       "                               'Chase': 6,\n",
       "                               'Kodansha': 2,\n",
       "                               'Salty': 1,\n",
       "                               'Dogs': 1,\n",
       "                               'Johnny': 1,\n",
       "                               'Goode': 1,\n",
       "                               'Bugs': 1,\n",
       "                               'Bunny': 1,\n",
       "                               'Mickey': 1,\n",
       "                               'Spillane': 1,\n",
       "                               'Groucho': 1,\n",
       "                               'Harpo': 1,\n",
       "                               'Stanford': 2,\n",
       "                               'God': 1,\n",
       "                               'Man': 2,\n",
       "                               'Norwegian': 1,\n",
       "                               'Wood': 3,\n",
       "                               'Beatles': 2,\n",
       "                               'Tokyo': 24,\n",
       "                               'Gotta': 2,\n",
       "                               'Have': 2,\n",
       "                               'Macmillan': 2,\n",
       "                               'Wa': 2,\n",
       "                               'Japanese': 5,\n",
       "                               'Giants': 2,\n",
       "                               'Tatsunori': 1,\n",
       "                               'Hara': 1,\n",
       "                               'Funny': 1,\n",
       "                               'Soho': 1,\n",
       "                               'Katzenstein': 5,\n",
       "                               'Sony': 13,\n",
       "                               'Luce': 1,\n",
       "                               'Fellowship': 1,\n",
       "                               'Walkman': 1,\n",
       "                               'Akio': 2,\n",
       "                               'Morita': 2,\n",
       "                               'Ms.': 14,\n",
       "                               'Kirkpatrick': 1,\n",
       "                               'Singapore': 4,\n",
       "                               'Siti': 1,\n",
       "                               'Zaharah': 1,\n",
       "                               'Sulaiman': 1,\n",
       "                               'No-Smoking': 1,\n",
       "                               'Week': 1,\n",
       "                               'Mara': 1,\n",
       "                               'Kuala': 1,\n",
       "                               'Lumpur': 1,\n",
       "                               'Backer': 1,\n",
       "                               'Spielvogel': 1,\n",
       "                               'Bates': 1,\n",
       "                               'Thai': 1,\n",
       "                               'Pramual': 1,\n",
       "                               'Sabhavasu': 1,\n",
       "                               'Bangkok': 1,\n",
       "                               'Central': 5,\n",
       "                               'Plaza': 1,\n",
       "                               'Hotel': 2,\n",
       "                               'Yasser': 1,\n",
       "                               'Arafat': 1,\n",
       "                               'Olympic': 3,\n",
       "                               'Committee': 12,\n",
       "                               'Palestine': 1,\n",
       "                               'Liberation': 1,\n",
       "                               'Organization': 3,\n",
       "                               'WAFA': 1,\n",
       "                               'Palestinian': 1,\n",
       "                               'PLO': 1,\n",
       "                               'Health': 12,\n",
       "                               'Tourism': 1,\n",
       "                               'Beijing': 7,\n",
       "                               'AIDS': 2,\n",
       "                               'People': 1,\n",
       "                               'Daily': 4,\n",
       "                               'PAP': 1,\n",
       "                               'Poland': 10,\n",
       "                               'Warsaw': 1,\n",
       "                               'Hungary': 4,\n",
       "                               'River': 10,\n",
       "                               'Danube': 1,\n",
       "                               'Nagymaros': 2,\n",
       "                               'Czechoslovakia': 5,\n",
       "                               'Prime': 3,\n",
       "                               'Miklos': 1,\n",
       "                               'Nemeth': 2,\n",
       "                               'Strindberg': 1,\n",
       "                               'Stockholm': 2,\n",
       "                               'Lighthouse': 1,\n",
       "                               'BRAMALEA': 1,\n",
       "                               'Scotia': 1,\n",
       "                               'McLeod': 1,\n",
       "                               'RBC': 1,\n",
       "                               'Dominion': 1,\n",
       "                               'Bramalea': 1,\n",
       "                               'Lane': 11,\n",
       "                               'Charlie': 1,\n",
       "                               'Chaplin': 4,\n",
       "                               'Steve': 1,\n",
       "                               'Martin': 10,\n",
       "                               'Little': 2,\n",
       "                               'Tramp': 5,\n",
       "                               'Purchase': 1,\n",
       "                               'Place': 1,\n",
       "                               'Artist': 8,\n",
       "                               'Sidewalk': 4,\n",
       "                               'Stories': 4,\n",
       "                               'Marc': 1,\n",
       "                               'Marder': 1,\n",
       "                               'Bill': 3,\n",
       "                               'Dill': 1,\n",
       "                               'Greenwich': 1,\n",
       "                               'Village': 1,\n",
       "                               'Sixth': 1,\n",
       "                               'Avenue': 2,\n",
       "                               'Cosmopolitan': 1,\n",
       "                               'Lights': 2,\n",
       "                               'Nicole': 1,\n",
       "                               'Alysia': 1,\n",
       "                               'Bowery': 1,\n",
       "                               'Mission': 1,\n",
       "                               'Claude': 1,\n",
       "                               'Chabrol': 2,\n",
       "                               'Story': 1,\n",
       "                               'Women': 1,\n",
       "                               'Marie-Louise': 3,\n",
       "                               'Giraud': 1,\n",
       "                               'Vichy': 2,\n",
       "                               'Resistance': 1,\n",
       "                               'Isabelle': 1,\n",
       "                               'Huppert': 1,\n",
       "                               'Marie': 1,\n",
       "                               'Latour': 2,\n",
       "                               'Old': 8,\n",
       "                               'Gringo': 1,\n",
       "                               'Fuentes': 1,\n",
       "                               'Mexican': 1,\n",
       "                               'Revolution': 1,\n",
       "                               'Peck': 1,\n",
       "                               'Video': 1,\n",
       "                               'Tip': 1,\n",
       "                               'Boeing': 2,\n",
       "                               'Seattle': 1,\n",
       "                               'Kawasaki': 1,\n",
       "                               'Heavy': 3,\n",
       "                               'Industries': 6,\n",
       "                               'Mitsubishi': 14,\n",
       "                               'Fuji': 1,\n",
       "                               'Napolitan': 1,\n",
       "                               'Jersey': 4,\n",
       "                               'Virginia': 4,\n",
       "                               'Dinkins': 11,\n",
       "                               'Republican': 1,\n",
       "                               'Giuliani': 5,\n",
       "                               'Roger': 2,\n",
       "                               'Ailes': 2,\n",
       "                               'Siegal': 1,\n",
       "                               'Shrum': 1,\n",
       "                               'Doak': 1,\n",
       "                               'Campaign': 1,\n",
       "                               'Peter': 10,\n",
       "                               'Powers': 1,\n",
       "                               'Lt.': 1,\n",
       "                               'Gov.': 2,\n",
       "                               'Wilder': 8,\n",
       "                               'Marshall': 6,\n",
       "                               'Coleman': 11,\n",
       "                               'Greer': 1,\n",
       "                               'Monticello': 1,\n",
       "                               'Jefferson': 1,\n",
       "                               'Bob': 7,\n",
       "                               'Goodman': 1,\n",
       "                               'Mark': 4,\n",
       "                               'Rozell': 1,\n",
       "                               'Mary': 11,\n",
       "                               'Rep.': 20,\n",
       "                               'Florio': 5,\n",
       "                               'Pinocchio': 3,\n",
       "                               'Jim': 4,\n",
       "                               'Courter': 10,\n",
       "                               'Squier': 1,\n",
       "                               'Salmore': 2,\n",
       "                               'Eagleton': 1,\n",
       "                               'Democrat': 5,\n",
       "                               \"O'Connor\": 2,\n",
       "                               'GOP': 2,\n",
       "                               'Nelson': 2,\n",
       "                               'Rockefeller': 5,\n",
       "                               'Chicago': 43,\n",
       "                               'Friday': 2,\n",
       "                               'Aug.': 2,\n",
       "                               'Southeast': 7,\n",
       "                               'Hormats': 3,\n",
       "                               'Investment': 8,\n",
       "                               'Drobnick': 1,\n",
       "                               'California': 26,\n",
       "                               'Graduate': 2,\n",
       "                               'School': 15,\n",
       "                               'European': 1,\n",
       "                               'Common': 1,\n",
       "                               'Market': 8,\n",
       "                               'Calder': 1,\n",
       "                               'Woodrow': 1,\n",
       "                               'Wilson': 1,\n",
       "                               'Internatonal': 1,\n",
       "                               'Princeton': 2,\n",
       "                               'Indonesia': 2,\n",
       "                               'Zealand': 1,\n",
       "                               'Asian': 1,\n",
       "                               'Brunei': 1,\n",
       "                               'Baker': 3,\n",
       "                               'Australian': 1,\n",
       "                               'Hawke': 1,\n",
       "                               'Farren': 1,\n",
       "                               'Chong-sik': 1,\n",
       "                               'Lee': 2,\n",
       "                               'Pennsylvania': 7,\n",
       "                               'Cathryn': 2,\n",
       "                               'Rice': 2,\n",
       "                               'Greenville': 13,\n",
       "                               'High': 20,\n",
       "                               'Germany': 8,\n",
       "                               'Nancy': 2,\n",
       "                               'Yeargin': 37,\n",
       "                               'Carolina': 13,\n",
       "                               'Education': 5,\n",
       "                               'Improvement': 2,\n",
       "                               'Walt': 1,\n",
       "                               'Haney': 1,\n",
       "                               'Albuquerque': 2,\n",
       "                               'N.M.': 2,\n",
       "                               'Macmillan\\\\/McGraw-Hill': 3,\n",
       "                               'Publishing': 4,\n",
       "                               'Scoring': 13,\n",
       "                               'Learning': 10,\n",
       "                               'County': 5,\n",
       "                               'Scholastic': 1,\n",
       "                               'Aptitude': 1,\n",
       "                               'Test': 4,\n",
       "                               'SAT': 1,\n",
       "                               'Cannell': 3,\n",
       "                               'Sandifer': 1,\n",
       "                               'Nobel': 1,\n",
       "                               'Prize': 1,\n",
       "                               'Townes': 1,\n",
       "                               'Joanne': 1,\n",
       "                               'Woodward': 1,\n",
       "                               'Linda': 2,\n",
       "                               'Ward': 13,\n",
       "                               'PTA': 1,\n",
       "                               'Laura': 1,\n",
       "                               'Dobson': 1,\n",
       "                               'Beth': 4,\n",
       "                               'Marchand': 2,\n",
       "                               'Kelli': 1,\n",
       "                               'Green': 1,\n",
       "                               'Elizabeth': 2,\n",
       "                               'Ariail': 1,\n",
       "                               'Joe': 2,\n",
       "                               'Watson': 4,\n",
       "                               'Mrs': 1,\n",
       "                               'GHS': 1,\n",
       "                               'Gayle': 1,\n",
       "                               'Key': 2,\n",
       "                               'Achievement': 3,\n",
       "                               'Britain': 9,\n",
       "                               'Communication': 1,\n",
       "                               'Kaminski': 4,\n",
       "                               'Traverse': 1,\n",
       "                               'Mich.': 5,\n",
       "                               'Macmillan\\\\/McGraw': 4,\n",
       "                               'CAT': 6,\n",
       "                               'Comprehensive': 5,\n",
       "                               'Iowa': 10,\n",
       "                               'Houghton': 1,\n",
       "                               'Mifflin': 1,\n",
       "                               'Harcourt': 1,\n",
       "                               'Brace': 1,\n",
       "                               'Jovanovich': 1,\n",
       "                               'Metropolitan': 1,\n",
       "                               'Arizona': 1,\n",
       "                               'Florida': 2,\n",
       "                               'Louisiana': 1,\n",
       "                               'Maryland': 2,\n",
       "                               'Kean': 2,\n",
       "                               'CTB': 1,\n",
       "                               'Mehrens': 2,\n",
       "                               'Michigan': 3,\n",
       "                               'Rick': 2,\n",
       "                               'Brownell': 2,\n",
       "                               'Random': 12,\n",
       "                               'CTBS': 1,\n",
       "                               'Alleghany': 2,\n",
       "                               'Sacramento': 3,\n",
       "                               'Loan': 6,\n",
       "                               'H.N.': 1,\n",
       "                               'Frances': 1,\n",
       "                               'C.': 10,\n",
       "                               'Berger': 1,\n",
       "                               'Foundation': 3,\n",
       "                               'Human': 3,\n",
       "                               'Alzheimer': 2,\n",
       "                               'Parkinson': 1,\n",
       "                               'Huntington': 1,\n",
       "                               'Mason': 7,\n",
       "                               'HHS': 3,\n",
       "                               'Louis': 11,\n",
       "                               'Sullivan': 5,\n",
       "                               'NIH': 4,\n",
       "                               'Disease': 1,\n",
       "                               'Control': 1,\n",
       "                               'Antonio': 3,\n",
       "                               'Novello': 2,\n",
       "                               'Child': 1,\n",
       "                               'Development': 5,\n",
       "                               'CDC': 1,\n",
       "                               'Myron': 1,\n",
       "                               'Genel': 2,\n",
       "                               'Yale': 2,\n",
       "                               'Medical': 3,\n",
       "                               'Down': 1,\n",
       "                               'Connecticut': 7,\n",
       "                               'Trust': 4,\n",
       "                               'Massachusetts': 7,\n",
       "                               'Jennison': 2,\n",
       "                               'OTC': 3,\n",
       "                               'Bancorp': 3,\n",
       "                               'Ed': 2,\n",
       "                               'Macheski': 1,\n",
       "                               'Wilton': 1,\n",
       "                               'Constitution': 12,\n",
       "                               'WFRR': 1,\n",
       "                               'L.P.': 1,\n",
       "                               'GHKM': 1,\n",
       "                               'Centerbank': 1,\n",
       "                               'NESB': 1,\n",
       "                               'Pennview': 1,\n",
       "                               'Univest': 1,\n",
       "                               'Dan': 2,\n",
       "                               'Nelms': 1,\n",
       "                               'Weisfield': 5,\n",
       "                               'Ratners': 9,\n",
       "                               'Jaguar': 4,\n",
       "                               'Heritage': 10,\n",
       "                               'Media': 5,\n",
       "                               'POP': 9,\n",
       "                               'Radio': 6,\n",
       "                               'Rally': 8,\n",
       "                               'Giant': 4,\n",
       "                               'Burt': 2,\n",
       "                               'Sugarman': 2,\n",
       "                               'Trotter': 4,\n",
       "                               'SCI': 3,\n",
       "                               'Systems': 1,\n",
       "                               'Huntsville': 1,\n",
       "                               'Ala.': 1,\n",
       "                               'Sept.': 12,\n",
       "                               'Internal': 1,\n",
       "                               'Revenue': 1,\n",
       "                               'IRS': 14,\n",
       "                               'Social': 1,\n",
       "                               'Security': 2,\n",
       "                               'Neal': 2,\n",
       "                               'Sonnett': 4,\n",
       "                               'Criminal': 1,\n",
       "                               'Defense': 2,\n",
       "                               'Miami': 8,\n",
       "                               'Gerald': 3,\n",
       "                               'Lefcourt': 1,\n",
       "                               'Bar': 2,\n",
       "                               'ABA': 6,\n",
       "                               'Justice': 12,\n",
       "                               'Christopher': 4,\n",
       "                               'Lezovich': 1,\n",
       "                               'Detroit': 4,\n",
       "                               'Raul': 1,\n",
       "                               'Ramirez': 2,\n",
       "                               'Calif': 3,\n",
       "                               'San': 19,\n",
       "                               'Francisco': 14,\n",
       "                               'Orrick': 1,\n",
       "                               'Herrington': 1,\n",
       "                               'Sutcliffe': 1,\n",
       "                               'DOONESBURY': 1,\n",
       "                               'Garry': 1,\n",
       "                               'Trudeau': 7,\n",
       "                               'Guild': 2,\n",
       "                               'America': 21,\n",
       "                               'East': 7,\n",
       "                               'Darkhorse': 3,\n",
       "                               'K.': 4,\n",
       "                               'Samnick': 3,\n",
       "                               'X': 2,\n",
       "                               'Second': 2,\n",
       "                               'TEXAS': 1,\n",
       "                               'Dallas': 7,\n",
       "                               'District': 3,\n",
       "                               'Jack': 5,\n",
       "                               'Hampton': 3,\n",
       "                               'December': 14,\n",
       "                               'Murray': 6,\n",
       "                               'Judicial': 1,\n",
       "                               'Conduct': 1,\n",
       "                               'GAF': 5,\n",
       "                               'Manhattan': 4,\n",
       "                               'Lowe': 1,\n",
       "                               'Wayne': 2,\n",
       "                               'N.J.': 7,\n",
       "                               'Vice': 1,\n",
       "                               'Chairman': 12,\n",
       "                               'Sherwin': 1,\n",
       "                               'Carbide': 1,\n",
       "                               'Iran\\\\/Contra': 1,\n",
       "                               'Mayer': 1,\n",
       "                               'Brown': 2,\n",
       "                               'Bromwich': 2,\n",
       "                               'Oliver': 2,\n",
       "                               'North': 2,\n",
       "                               'D.C.': 4,\n",
       "                               'Cooper': 2,\n",
       "                               'Tire': 1,\n",
       "                               'Rubber': 1,\n",
       "                               'Albany': 1,\n",
       "                               'Ga.': 2,\n",
       "                               'Bridgestone\\\\/Firestone': 2,\n",
       "                               'Inc': 19,\n",
       "                               'Fair': 2,\n",
       "                               'Takuma': 2,\n",
       "                               'Yamamoto': 5,\n",
       "                               'Machines': 1,\n",
       "                               'Hiroshima': 2,\n",
       "                               'Nagano': 2,\n",
       "                               'Saitama': 1,\n",
       "                               'Wakayama': 1,\n",
       "                               'Michio': 1,\n",
       "                               'Sasaki': 1,\n",
       "                               'Keidanren': 1,\n",
       "                               'Federation': 1,\n",
       "                               'Organizations': 1,\n",
       "                               'Backe': 3,\n",
       "                               'Atlantic': 2,\n",
       "                               'Publications': 1,\n",
       "                               'CBS': 2,\n",
       "                               'Price': 5,\n",
       "                               'Communications': 2,\n",
       "                               'NTG': 2,\n",
       "                               'Osborn': 1,\n",
       "                               'Desai': 1,\n",
       "                               'Capital': 10,\n",
       "                               'Michaels': 1,\n",
       "                               'Stores': 1,\n",
       "                               'Furukawa': 2,\n",
       "                               'Dresser': 2,\n",
       "                               'Heidelberg': 1,\n",
       "                               'Structural': 2,\n",
       "                               'Dynamics': 1,\n",
       "                               'Deposits-a': 1,\n",
       "                               'Rate': 1,\n",
       "                               'Monitor': 1,\n",
       "                               'LSI': 1,\n",
       "                               'Logic': 1,\n",
       "                               'Wilfred': 1,\n",
       "                               'Corrigan': 1,\n",
       "                               'Santa': 6,\n",
       "                               'Clara': 1,\n",
       "                               'Calif.': 16,\n",
       "                               'Stark': 1,\n",
       "                               'Robertson': 1,\n",
       "                               'Stephens': 1,\n",
       "                               'INGERSOLL-RAND': 1,\n",
       "                               'Woodcliff': 1,\n",
       "                               'Lake': 4,\n",
       "                               'N.J': 5,\n",
       "                               'G.': 7,\n",
       "                               'Kuhns': 1,\n",
       "                               'General': 14,\n",
       "                               'Jay': 2,\n",
       "                               'Goldinger': 1,\n",
       "                               'Insight': 1,\n",
       "                               'Tom': 2,\n",
       "                               'Trettien': 1,\n",
       "                               'Banque': 1,\n",
       "                               'Paribas': 1,\n",
       "                               'Thursday': 9,\n",
       "                               'Madison': 5,\n",
       "                               'Los': 13,\n",
       "                               'Angeles': 12,\n",
       "                               'Columbia': 37,\n",
       "                               'Pictures': 3,\n",
       "                               'Entertainment': 5,\n",
       "                               'Estate': 4,\n",
       "                               'Georgia-Pacific': 11,\n",
       "                               'Northern': 4,\n",
       "                               'Nekoosa': 9,\n",
       "                               'Commodity': 3,\n",
       "                               'Cosby': 9,\n",
       "                               'Show': 1,\n",
       "                               'NBC': 2,\n",
       "                               'Huxtable': 1,\n",
       "                               'Viacom': 7,\n",
       "                               'Different': 1,\n",
       "                               'Gillespie': 2,\n",
       "                               'A.C.': 1,\n",
       "                               'Nielsen': 1,\n",
       "                               'Providence': 2,\n",
       "                               'R.I.': 1,\n",
       "                               'Raleigh': 1,\n",
       "                               'N.C.': 3,\n",
       "                               'Louisville': 2,\n",
       "                               'Ky.': 1,\n",
       "                               'Dick': 1,\n",
       "                               'Lobo': 1,\n",
       "                               ...}),\n",
       "                     'NNPS': FreqDist({'ADRs': 2,\n",
       "                               'ASSETS': 1,\n",
       "                               'ASSOCIATES': 1,\n",
       "                               'Airlines': 5,\n",
       "                               'Airways': 1,\n",
       "                               'Americans': 6,\n",
       "                               'Angels': 1,\n",
       "                               'Appeals': 1,\n",
       "                               'Appropriations': 1,\n",
       "                               'Articles': 1,\n",
       "                               'Asians': 1,\n",
       "                               'Associates': 5,\n",
       "                               'BILLS': 1,\n",
       "                               'BRIEFS': 1,\n",
       "                               'Bricklayers': 1,\n",
       "                               'Bridges': 1,\n",
       "                               'Brothers': 3,\n",
       "                               'Builders': 1,\n",
       "                               'Burgundies': 2,\n",
       "                               'Cabernets': 2,\n",
       "                               'Centers': 1,\n",
       "                               'Chardonnays': 1,\n",
       "                               'Charities': 1,\n",
       "                               'Communications': 4,\n",
       "                               'Containers': 16,\n",
       "                               'Contracts': 1,\n",
       "                               'Contras': 2,\n",
       "                               'Craftsmen': 1,\n",
       "                               'Dakotas': 1,\n",
       "                               'Dealers': 2,\n",
       "                               'Delegates': 1,\n",
       "                               'Democrats': 5,\n",
       "                               'Dolphins': 1,\n",
       "                               'Donuts': 1,\n",
       "                               'Elders': 1,\n",
       "                               'Engineers': 2,\n",
       "                               'F-series': 1,\n",
       "                               'FUNDS': 1,\n",
       "                               'Facilities': 1,\n",
       "                               'Foods': 1,\n",
       "                               'Friends': 3,\n",
       "                               'Fundamentalists': 1,\n",
       "                               'Futures': 2,\n",
       "                               'GRAINS': 1,\n",
       "                               'Germans': 1,\n",
       "                               'Giants': 3,\n",
       "                               'Holdings': 1,\n",
       "                               'Industries': 12,\n",
       "                               'Inns': 1,\n",
       "                               'Institutes': 2,\n",
       "                               'Instruments': 2,\n",
       "                               'Investments': 1,\n",
       "                               'Investors': 3,\n",
       "                               'Islands': 2,\n",
       "                               'Issues': 3,\n",
       "                               'Journals': 1,\n",
       "                               'Laboratories': 2,\n",
       "                               'Lakes': 1,\n",
       "                               'Lawmakers': 1,\n",
       "                               'Lawyers': 1,\n",
       "                               'Lines': 1,\n",
       "                               'METALS': 1,\n",
       "                               'Machines': 3,\n",
       "                               'Manufacturers': 1,\n",
       "                               'Markets': 4,\n",
       "                               'Materials': 10,\n",
       "                               'Mercedes': 1,\n",
       "                               'Mergers': 1,\n",
       "                               'Messrs.': 2,\n",
       "                               'Monopolies': 1,\n",
       "                               'Motors': 5,\n",
       "                               'Nations': 2,\n",
       "                               'Netherlands': 1,\n",
       "                               'Notes': 1,\n",
       "                               'Operations': 1,\n",
       "                               'Options': 2,\n",
       "                               'Parkinson': 1,\n",
       "                               'Partners': 3,\n",
       "                               'Philippines': 3,\n",
       "                               'Pictures': 1,\n",
       "                               'Plains': 1,\n",
       "                               'Preferences': 1,\n",
       "                               'Productions': 1,\n",
       "                               'Products': 1,\n",
       "                               'Publications': 1,\n",
       "                               'RATES': 1,\n",
       "                               'Republicans': 1,\n",
       "                               'Resources': 4,\n",
       "                               'Rieslings': 1,\n",
       "                               'SOYBEANS': 1,\n",
       "                               'Savings': 5,\n",
       "                               'Securities': 16,\n",
       "                               'Services': 4,\n",
       "                               'Soviets': 8,\n",
       "                               'Springs': 1,\n",
       "                               'States': 5,\n",
       "                               'Stores': 3,\n",
       "                               'Systems': 4,\n",
       "                               'Tots': 1,\n",
       "                               'Toys': 1,\n",
       "                               'Travelers': 4,\n",
       "                               'Underwoods': 1,\n",
       "                               'Utilities': 1,\n",
       "                               'Virginians': 1,\n",
       "                               'Works': 1,\n",
       "                               'Writers': 2,\n",
       "                               'Yorkers': 1}),\n",
       "                     'NNS': FreqDist({'years': 115,\n",
       "                               'filters': 7,\n",
       "                               'deaths': 6,\n",
       "                               'workers': 20,\n",
       "                               'researchers': 13,\n",
       "                               'lungs': 1,\n",
       "                               'exposures': 3,\n",
       "                               'symptoms': 1,\n",
       "                               'decades': 3,\n",
       "                               'cigarettes': 6,\n",
       "                               'findings': 8,\n",
       "                               'results': 21,\n",
       "                               'properties': 1,\n",
       "                               'products': 32,\n",
       "                               'smokers': 2,\n",
       "                               'users': 2,\n",
       "                               'schools': 9,\n",
       "                               'amounts': 5,\n",
       "                               'men': 10,\n",
       "                               'times': 16,\n",
       "                               'diseases': 7,\n",
       "                               'countries': 21,\n",
       "                               'buildings': 3,\n",
       "                               'nations': 15,\n",
       "                               'fibers': 4,\n",
       "                               'amphobiles': 1,\n",
       "                               'uses': 4,\n",
       "                               'Areas': 1,\n",
       "                               'Workers': 2,\n",
       "                               'sacks': 1,\n",
       "                               'clouds': 1,\n",
       "                               'parts': 7,\n",
       "                               'fans': 2,\n",
       "                               'managers': 40,\n",
       "                               'resources': 5,\n",
       "                               'events': 3,\n",
       "                               'Yields': 1,\n",
       "                               'funds': 67,\n",
       "                               'signs': 8,\n",
       "                               'declines': 5,\n",
       "                               'rates': 49,\n",
       "                               'yields': 7,\n",
       "                               'dividends': 21,\n",
       "                               'investments': 17,\n",
       "                               'days': 51,\n",
       "                               'maturities': 3,\n",
       "                               'institutions': 18,\n",
       "                               'rises': 1,\n",
       "                               'bills': 19,\n",
       "                               'investors': 63,\n",
       "                               'Assets': 1,\n",
       "                               'securities': 33,\n",
       "                               'fees': 19,\n",
       "                               'seats': 7,\n",
       "                               'shareholders': 20,\n",
       "                               'interests': 7,\n",
       "                               'controls': 3,\n",
       "                               'systems': 6,\n",
       "                               'people': 56,\n",
       "                               'sales': 59,\n",
       "                               'savings': 10,\n",
       "                               'bonds': 59,\n",
       "                               'obligations': 2,\n",
       "                               'taxes': 4,\n",
       "                               'operations': 29,\n",
       "                               'titans': 1,\n",
       "                               'confines': 1,\n",
       "                               'towns': 2,\n",
       "                               'guests': 3,\n",
       "                               'stars': 2,\n",
       "                               'owners': 4,\n",
       "                               'makers': 12,\n",
       "                               'officials': 47,\n",
       "                               'giants': 2,\n",
       "                               'knowns': 1,\n",
       "                               'starters': 1,\n",
       "                               'executives': 19,\n",
       "                               'busloads': 1,\n",
       "                               'wives': 1,\n",
       "                               'lights': 2,\n",
       "                               'drinks': 1,\n",
       "                               'visitors': 2,\n",
       "                               'drivers': 3,\n",
       "                               'crews': 1,\n",
       "                               'schoolboys': 1,\n",
       "                               'cars': 19,\n",
       "                               'dummies': 1,\n",
       "                               'machines': 2,\n",
       "                               'execs': 1,\n",
       "                               'meetings': 6,\n",
       "                               'buses': 3,\n",
       "                               'moons': 1,\n",
       "                               'chefs': 2,\n",
       "                               'CEOs': 2,\n",
       "                               'figures': 12,\n",
       "                               'tallies': 1,\n",
       "                               'Exports': 1,\n",
       "                               'imports': 12,\n",
       "                               'disputes': 3,\n",
       "                               'conflicts': 2,\n",
       "                               'exports': 11,\n",
       "                               'Imports': 3,\n",
       "                               'advertisers': 13,\n",
       "                               'Plans': 2,\n",
       "                               'discounts': 1,\n",
       "                               'fixtures': 1,\n",
       "                               'weeklies': 2,\n",
       "                               'credits': 2,\n",
       "                               'bonuses': 2,\n",
       "                               'pages': 8,\n",
       "                               'months': 59,\n",
       "                               'giveaways': 1,\n",
       "                               'subscribers': 1,\n",
       "                               'telephones': 1,\n",
       "                               'watches': 7,\n",
       "                               'gains': 21,\n",
       "                               'risks': 11,\n",
       "                               'bidders': 3,\n",
       "                               'proceedings': 5,\n",
       "                               'places': 4,\n",
       "                               'forecasts': 4,\n",
       "                               'efficiencies': 1,\n",
       "                               'rewards': 2,\n",
       "                               'concerns': 13,\n",
       "                               'factors': 7,\n",
       "                               'holders': 14,\n",
       "                               'increases': 13,\n",
       "                               'boosts': 1,\n",
       "                               'negotiations': 3,\n",
       "                               'shares': 114,\n",
       "                               'cents': 70,\n",
       "                               'directors': 7,\n",
       "                               'electronics': 10,\n",
       "                               'appliances': 5,\n",
       "                               'ratepayers': 1,\n",
       "                               'overruns': 1,\n",
       "                               'groups': 10,\n",
       "                               'refunds': 2,\n",
       "                               'customers': 23,\n",
       "                               'appeals': 4,\n",
       "                               'attempts': 2,\n",
       "                               'collections': 2,\n",
       "                               'earnings': 38,\n",
       "                               'addresses': 1,\n",
       "                               'courts': 7,\n",
       "                               'expenses': 8,\n",
       "                               'calculations': 1,\n",
       "                               'trucks': 15,\n",
       "                               'units': 12,\n",
       "                               'records': 5,\n",
       "                               'Sales': 19,\n",
       "                               'reductions': 4,\n",
       "                               'devices': 7,\n",
       "                               'miles': 4,\n",
       "                               'vehicles': 6,\n",
       "                               'Documents': 1,\n",
       "                               'documents': 5,\n",
       "                               'orders': 28,\n",
       "                               'prospects': 7,\n",
       "                               'strings': 2,\n",
       "                               'details': 6,\n",
       "                               'Analysts': 9,\n",
       "                               'chips': 5,\n",
       "                               'processors': 3,\n",
       "                               'supercomputers': 2,\n",
       "                               'terms': 18,\n",
       "                               'stockholders': 3,\n",
       "                               'weeks': 22,\n",
       "                               'companies': 63,\n",
       "                               'assets': 17,\n",
       "                               'sheets': 3,\n",
       "                               'positions': 5,\n",
       "                               'patents': 4,\n",
       "                               'copyrights': 1,\n",
       "                               'rights': 20,\n",
       "                               'investigations': 1,\n",
       "                               'sanctions': 5,\n",
       "                               'degrees': 4,\n",
       "                               'citizens': 1,\n",
       "                               'negotiators': 2,\n",
       "                               'protections': 1,\n",
       "                               'scientists': 7,\n",
       "                               'authors': 5,\n",
       "                               'firms': 34,\n",
       "                               'teams': 3,\n",
       "                               'officers': 2,\n",
       "                               'prosecutors': 3,\n",
       "                               'pirates': 1,\n",
       "                               'procedures': 3,\n",
       "                               'producers': 6,\n",
       "                               'showings': 1,\n",
       "                               'films': 3,\n",
       "                               'parlors': 1,\n",
       "                               'standards': 9,\n",
       "                               'works': 5,\n",
       "                               'problems': 28,\n",
       "                               'cases': 22,\n",
       "                               'improvements': 1,\n",
       "                               'efforts': 11,\n",
       "                               'developments': 1,\n",
       "                               'reports': 13,\n",
       "                               'banks': 51,\n",
       "                               'milestones': 1,\n",
       "                               'COMPUTERS': 1,\n",
       "                               'computers': 15,\n",
       "                               'sets': 4,\n",
       "                               'screens': 2,\n",
       "                               'data': 12,\n",
       "                               'audiocassettes': 1,\n",
       "                               'hobbyists': 1,\n",
       "                               'PCs': 6,\n",
       "                               'models': 5,\n",
       "                               'types': 6,\n",
       "                               'keyboards': 1,\n",
       "                               'memories': 2,\n",
       "                               'counterparts': 2,\n",
       "                               'contributors': 1,\n",
       "                               'versions': 2,\n",
       "                               'drives': 2,\n",
       "                               'engineers': 2,\n",
       "                               'co-developers': 1,\n",
       "                               'modems': 1,\n",
       "                               'shipments': 5,\n",
       "                               'pharmaceuticals': 3,\n",
       "                               'holdings': 3,\n",
       "                               'fields': 11,\n",
       "                               'barrels': 7,\n",
       "                               'reserves': 9,\n",
       "                               'Reserves': 2,\n",
       "                               'capsules': 1,\n",
       "                               'businesses': 10,\n",
       "                               'quantities': 2,\n",
       "                               'possessions': 1,\n",
       "                               'changes': 15,\n",
       "                               'classifications': 1,\n",
       "                               'categories': 1,\n",
       "                               'preferences': 1,\n",
       "                               'beneficiaries': 1,\n",
       "                               'dollars': 17,\n",
       "                               'costs': 22,\n",
       "                               'clients': 18,\n",
       "                               'purchases': 9,\n",
       "                               'instruments': 5,\n",
       "                               'advantages': 2,\n",
       "                               'payments': 21,\n",
       "                               'purchasers': 2,\n",
       "                               'members': 26,\n",
       "                               'creditors': 6,\n",
       "                               'lawsuits': 2,\n",
       "                               'debts': 6,\n",
       "                               'editions': 1,\n",
       "                               'currencies': 2,\n",
       "                               'yen': 15,\n",
       "                               'portfolios': 5,\n",
       "                               'stocks': 66,\n",
       "                               'regulators': 14,\n",
       "                               '1920s': 1,\n",
       "                               'billions': 3,\n",
       "                               'People': 5,\n",
       "                               'claims': 3,\n",
       "                               'brokers': 6,\n",
       "                               'nets': 1,\n",
       "                               'planners': 2,\n",
       "                               'markets': 52,\n",
       "                               'gyrations': 6,\n",
       "                               'prices': 86,\n",
       "                               'premiums': 3,\n",
       "                               'specialists': 7,\n",
       "                               'valuations': 1,\n",
       "                               'analysts': 30,\n",
       "                               'levels': 13,\n",
       "                               'receipts': 3,\n",
       "                               'folks': 3,\n",
       "                               'talks': 18,\n",
       "                               'Soviets': 2,\n",
       "                               'Communists': 1,\n",
       "                               'Americans': 3,\n",
       "                               'obstacles': 2,\n",
       "                               'hundreds': 2,\n",
       "                               'millions': 6,\n",
       "                               'goods': 13,\n",
       "                               'Factories': 1,\n",
       "                               'contractors': 1,\n",
       "                               'effects': 3,\n",
       "                               'patterns': 3,\n",
       "                               'measures': 5,\n",
       "                               'payrolls': 2,\n",
       "                               'economists': 5,\n",
       "                               'imbalances': 2,\n",
       "                               'signals': 1,\n",
       "                               'Inventories': 1,\n",
       "                               'clues': 2,\n",
       "                               'Economists': 2,\n",
       "                               'inventories': 6,\n",
       "                               'cutbacks': 5,\n",
       "                               'Orders': 1,\n",
       "                               'durable-goods': 1,\n",
       "                               'Shipments': 1,\n",
       "                               'Manufacturers': 1,\n",
       "                               'backlogs': 2,\n",
       "                               'homes': 3,\n",
       "                               'contracts': 24,\n",
       "                               'materials': 16,\n",
       "                               'vendors': 1,\n",
       "                               'pressures': 7,\n",
       "                               'suppliers': 3,\n",
       "                               'indicators': 5,\n",
       "                               'Items': 1,\n",
       "                               'quotas': 2,\n",
       "                               'manufacturers': 6,\n",
       "                               'Americana': 2,\n",
       "                               'boomers': 1,\n",
       "                               'sides': 9,\n",
       "                               'Characters': 1,\n",
       "                               'reruns': 4,\n",
       "                               'careers': 2,\n",
       "                               'marriages': 2,\n",
       "                               'affairs': 6,\n",
       "                               'writers': 2,\n",
       "                               'outsiders': 1,\n",
       "                               'relations': 9,\n",
       "                               'Japanese': 4,\n",
       "                               'retorts': 1,\n",
       "                               'lyrics': 1,\n",
       "                               'copies': 5,\n",
       "                               'charts': 1,\n",
       "                               'books': 5,\n",
       "                               'dashes': 1,\n",
       "                               'virtues': 1,\n",
       "                               'ballplayers': 3,\n",
       "                               'Polls': 1,\n",
       "                               'Fans': 1,\n",
       "                               'balls': 1,\n",
       "                               'ushers': 1,\n",
       "                               'ties': 6,\n",
       "                               'players': 5,\n",
       "                               'rules': 8,\n",
       "                               'lives': 4,\n",
       "                               'sums': 2,\n",
       "                               'parties': 6,\n",
       "                               'passages': 1,\n",
       "                               'aspects': 1,\n",
       "                               'employees': 20,\n",
       "                               'partners': 7,\n",
       "                               'observations': 1,\n",
       "                               'salarymen': 1,\n",
       "                               'features': 4,\n",
       "                               'corners': 1,\n",
       "                               'restaurants': 3,\n",
       "                               'stores': 9,\n",
       "                               'sports': 3,\n",
       "                               'centers': 2,\n",
       "                               'Discos': 1,\n",
       "                               'clubs': 2,\n",
       "                               'bars': 1,\n",
       "                               'hours': 9,\n",
       "                               'theaters': 1,\n",
       "                               'elevators': 6,\n",
       "                               'hospitals': 1,\n",
       "                               'stalls': 1,\n",
       "                               'posters': 1,\n",
       "                               'signboards': 1,\n",
       "                               'consumers': 10,\n",
       "                               'values': 2,\n",
       "                               'conditions': 18,\n",
       "                               'organizations': 3,\n",
       "                               'tests': 16,\n",
       "                               'associates': 2,\n",
       "                               'charges': 15,\n",
       "                               'loans': 10,\n",
       "                               'environmentalists': 2,\n",
       "                               'dams': 1,\n",
       "                               'periods': 2,\n",
       "                               'oils': 1,\n",
       "                               'weddings': 2,\n",
       "                               'couples': 1,\n",
       "                               'rings': 1,\n",
       "                               'statistics': 3,\n",
       "                               'debentures': 7,\n",
       "                               'warrants': 5,\n",
       "                               'underwriters': 3,\n",
       "                               'dealers': 15,\n",
       "                               'streets': 7,\n",
       "                               'ensembles': 1,\n",
       "                               'characters': 1,\n",
       "                               'intertitles': 1,\n",
       "                               'words': 4,\n",
       "                               'women': 15,\n",
       "                               'cabs': 1,\n",
       "                               'jugglers': 1,\n",
       "                               'magicians': 1,\n",
       "                               'hustlers': 1,\n",
       "                               'passers-by': 1,\n",
       "                               'skirmishes': 1,\n",
       "                               'thugs': 1,\n",
       "                               'beds': 1,\n",
       "                               'stakes': 2,\n",
       "                               'children': 7,\n",
       "                               'voices': 2,\n",
       "                               'Germans': 1,\n",
       "                               'thousands': 4,\n",
       "                               'fighters': 1,\n",
       "                               'Jews': 1,\n",
       "                               'goodies': 1,\n",
       "                               'scenes': 3,\n",
       "                               'movies': 1,\n",
       "                               'plans': 15,\n",
       "                               'discussions': 7,\n",
       "                               'stages': 3,\n",
       "                               'sections': 2,\n",
       "                               'mid-1990s': 1,\n",
       "                               'campaigns': 4,\n",
       "                               'contests': 2,\n",
       "                               'ads': 8,\n",
       "                               'fears': 3,\n",
       "                               'issues': 36,\n",
       "                               'stirrings': 1,\n",
       "                               'politics': 4,\n",
       "                               'fights': 1,\n",
       "                               'commercials': 1,\n",
       "                               'elections': 7,\n",
       "                               'contributions': 1,\n",
       "                               'links': 2,\n",
       "                               'innuendoes': 1,\n",
       "                               'consultants': 2,\n",
       "                               'photos': 1,\n",
       "                               'politicians': 6,\n",
       "                               'candidates': 9,\n",
       "                               'bullets': 3,\n",
       "                               'errors': 1,\n",
       "                               'reservations': 2,\n",
       "                               'generations': 1,\n",
       "                               'dynamics': 2,\n",
       "                               'advertisements': 2,\n",
       "                               'shadows': 1,\n",
       "                               'boyfriends': 1,\n",
       "                               'victims': 8,\n",
       "                               'lawyers': 14,\n",
       "                               'rapists': 1,\n",
       "                               'lawmakers': 3,\n",
       "                               'stations': 10,\n",
       "                               'questions': 22,\n",
       "                               'attacks': 3,\n",
       "                               'Pictures': 1,\n",
       "                               'drums': 1,\n",
       "                               'neighbors': 1,\n",
       "                               'partisans': 2,\n",
       "                               'photographs': 2,\n",
       "                               'Barrels': 1,\n",
       "                               'Seats': 1,\n",
       "                               'Interviews': 1,\n",
       "                               'fits': 1,\n",
       "                               'starts': 1,\n",
       "                               'economies': 3,\n",
       "                               'commitments': 8,\n",
       "                               'wages': 2,\n",
       "                               'sites': 1,\n",
       "                               'tigers': 1,\n",
       "                               'jobs': 14,\n",
       "                               'constraints': 2,\n",
       "                               'burdens': 1,\n",
       "                               '1990s': 1,\n",
       "                               'multinationals': 1,\n",
       "                               'plants': 12,\n",
       "                               'decisions': 4,\n",
       "                               'sectors': 1,\n",
       "                               'tubes': 1,\n",
       "                               'Countries': 1,\n",
       "                               'ministers': 1,\n",
       "                               'matters': 2,\n",
       "                               'Participants': 1,\n",
       "                               'friends': 3,\n",
       "                               'flows': 2,\n",
       "                               'functions': 3,\n",
       "                               'leases': 2,\n",
       "                               'bases': 3,\n",
       "                               'marbles': 1,\n",
       "                               'eyes': 2,\n",
       "                               'Skills': 3,\n",
       "                               'graders': 3,\n",
       "                               'notes': 29,\n",
       "                               'forms': 8,\n",
       "                               'answers': 10,\n",
       "                               'students': 31,\n",
       "                               'parents': 5,\n",
       "                               'classes': 2,\n",
       "                               'laurels': 1,\n",
       "                               'colleagues': 6,\n",
       "                               'actions': 5,\n",
       "                               'teachers': 11,\n",
       "                               'provisions': 6,\n",
       "                               'laws': 8,\n",
       "                               'Prosecutors': 2,\n",
       "                               'scores': 11,\n",
       "                               'educators': 5,\n",
       "                               'states': 11,\n",
       "                               'erasures': 1,\n",
       "                               'ones': 9,\n",
       "                               'occurrences': 1,\n",
       "                               'practices': 5,\n",
       "                               'booklets': 5,\n",
       "                               'areas': 10,\n",
       "                               'Experts': 1,\n",
       "                               'promotions': 2,\n",
       "                               'districts': 4,\n",
       "                               'interventions': 1,\n",
       "                               'firings': 1,\n",
       "                               'grants': 1,\n",
       "                               'projects': 3,\n",
       "                               'reforms': 6,\n",
       "                               'Critics': 2,\n",
       "                               'administrators': 1,\n",
       "                               'allegations': 2,\n",
       "                               'inferences': 1,\n",
       "                               'worries': 1,\n",
       "                               'governors': 2,\n",
       "                               'bricks': 1,\n",
       "                               'gangs': 1,\n",
       "                               'kids': 5,\n",
       "                               'honors': 1,\n",
       "                               'programs': 23,\n",
       "                               'halls': 1,\n",
       "                               'neighborhoods': 2,\n",
       "                               'blacks': 6,\n",
       "                               'ambitions': 2,\n",
       "                               'reformers': 2,\n",
       "                               'things': 15,\n",
       "                               'cheerleaders': 1,\n",
       "                               'approaches': 1,\n",
       "                               'competitions': 1,\n",
       "                               'weekends': 1,\n",
       "                               'stands': 2,\n",
       "                               'Pressures': 1,\n",
       "                               'Friends': 1,\n",
       "                               'points': 30,\n",
       "                               'others': 14,\n",
       "                               'studies': 3,\n",
       "                               'motives': 1,\n",
       "                               'subjects': 2,\n",
       "                               'rankings': 1,\n",
       "                               'newspapers': 4,\n",
       "                               'alumni': 1,\n",
       "                               'hands': 6,\n",
       "                               'superiors': 1,\n",
       "                               'authorities': 5,\n",
       "                               'callers': 2,\n",
       "                               'particulars': 1,\n",
       "                               'policies': 4,\n",
       "                               'Editorials': 1,\n",
       "                               'offenders': 3,\n",
       "                               'witnesses': 1,\n",
       "                               'T-shirts': 1,\n",
       "                               'corridors': 1,\n",
       "                               'shirts': 1,\n",
       "                               'aspersions': 1,\n",
       "                               'worms': 1,\n",
       "                               'workbooks': 1,\n",
       "                               'worksheets': 2,\n",
       "                               'two-sevenths': 1,\n",
       "                               'three-sevenths': 1,\n",
       "                               'Worksheets': 1,\n",
       "                               'instances': 2,\n",
       "                               'parallels': 2,\n",
       "                               'critics': 8,\n",
       "                               'aids': 1,\n",
       "                               'tools': 1,\n",
       "                               'binders': 1,\n",
       "                               'preparatives': 1,\n",
       "                               'subskills': 2,\n",
       "                               'graphs': 1,\n",
       "                               'kits': 1,\n",
       "                               'sounds': 3,\n",
       "                               'examples': 1,\n",
       "                               'matches': 1,\n",
       "                               'items': 6,\n",
       "                               'offices': 5,\n",
       "                               'services': 25,\n",
       "                               'transplants': 9,\n",
       "                               'humans': 1,\n",
       "                               'anti-abortionists': 2,\n",
       "                               'therapies': 1,\n",
       "                               'abortions': 1,\n",
       "                               'implications': 2,\n",
       "                               'doctors': 1,\n",
       "                               'posts': 3,\n",
       "                               'names': 3,\n",
       "                               'views': 5,\n",
       "                               'judgments': 1,\n",
       "                               'applications': 6,\n",
       "                               'foundations': 1,\n",
       "                               'tissues': 2,\n",
       "                               'fronts': 1,\n",
       "                               'genes': 2,\n",
       "                               'regions': 3,\n",
       "                               'traders': 48,\n",
       "                               'targets': 3,\n",
       "                               'speculators': 3,\n",
       "                               'losses': 13,\n",
       "                               'ADRs': 2,\n",
       "                               'warnings': 2,\n",
       "                               'attorneys': 6,\n",
       "                               'cities': 5,\n",
       "                               'transactions': 21,\n",
       "                               'Attorneys': 2,\n",
       "                               'identities': 1,\n",
       "                               'dozens': 4,\n",
       "                               'letters': 9,\n",
       "                               'accounts': 8,\n",
       "                               'individuals': 8,\n",
       "                               'circumstances': 3,\n",
       "                               'ethics': 1,\n",
       "                               'taxpayers': 5,\n",
       "                               '8300s': 1,\n",
       "                               'Individuals': 1,\n",
       "                               'Lawyers': 1,\n",
       "                               'returns': 11,\n",
       "                               'assertions': 1,\n",
       "                               'SALARIES': 1,\n",
       "                               'judges': 7,\n",
       "                               'clerks': 1,\n",
       "                               'Judges': 1,\n",
       "                               'accountants': 1,\n",
       "                               'TROUBLES': 1,\n",
       "                               'screenwriters': 1,\n",
       "                               'threats': 2,\n",
       "                               'damages': 6,\n",
       "                               'referrals': 1,\n",
       "                               'activities': 9,\n",
       "                               'restrictions': 8,\n",
       "                               'providers': 1,\n",
       "                               'limits': 4,\n",
       "                               'comments': 3,\n",
       "                               'calls': 1,\n",
       "                               'remarks': 1,\n",
       "                               'queers': 1,\n",
       "                               'boys': 2,\n",
       "                               'arguments': 2,\n",
       "                               'trials': 1,\n",
       "                               'mistrials': 1,\n",
       "                               'narcotics': 1,\n",
       "                               'Terms': 8,\n",
       "                               'feet': 3,\n",
       "                               'acres': 2,\n",
       "                               'bids': 10,\n",
       "                               'leaders': 10,\n",
       "                               'competitors': 2,\n",
       "                               'auctions': 5,\n",
       "                               'violations': 16,\n",
       "                               'situations': 2,\n",
       "                               'profits': 13,\n",
       "                               'benefits': 9,\n",
       "                               'gifts': 1,\n",
       "                               'businessmen': 1,\n",
       "                               'complaints': 4,\n",
       "                               'Foreigners': 1,\n",
       "                               'semiconductors': 1,\n",
       "                               'telecommunications': 4,\n",
       "                               'municipalities': 4,\n",
       "                               'headquarters': 4,\n",
       "                               'PAPERS': 1,\n",
       "                               'papers': 1,\n",
       "                               'media': 5,\n",
       "                               'shovels': 2,\n",
       "                               'thrifts': 4,\n",
       "                               'billings': 1,\n",
       "                               'techniques': 4,\n",
       "                               'wafers': 1,\n",
       "                               'additions': 2,\n",
       "                               'buyers': 12,\n",
       "                               'jitters': 1,\n",
       "                               'marks': 8,\n",
       "                               'wings': 2,\n",
       "                               'cues': 1,\n",
       "                               'Dealers': 7,\n",
       "                               'participants': 4,\n",
       "                               'expectations': 5,\n",
       "                               'ounces': 3,\n",
       "                               'ratings': 10,\n",
       "                               'viewers': 1,\n",
       "                               'affiliates': 2,\n",
       "                               'shows': 3,\n",
       "                               'episodes': 2,\n",
       "                               'tactics': 1,\n",
       "                               'comedies': 1,\n",
       "                               'networks': 1,\n",
       "                               'magazines': 1,\n",
       "                               'articles': 1,\n",
       "                               'pieces': 2,\n",
       "                               'topics': 2,\n",
       "                               'essays': 1,\n",
       "                               'editors': 4,\n",
       "                               'aisles': 1,\n",
       "                               'guys': 1,\n",
       "                               'arrows': 1,\n",
       "                               'Modifications': 1,\n",
       "                               'experts': 7,\n",
       "                               'spenders': 2,\n",
       "                               'economics': 2,\n",
       "                               'revenues': 1,\n",
       "                               'subscriptions': 2,\n",
       "                               'newsstands': 1,\n",
       "                               'Billings': 1,\n",
       "                               'rentals': 1,\n",
       "                               'accidents': 1,\n",
       "                               'investor-relations': 1,\n",
       "                               'marketing-communications': 1,\n",
       "                               'proceeds': 2,\n",
       "                               'subsidiaries': 4,\n",
       "                               'advocates': 2,\n",
       "                               'steps': 2,\n",
       "                               'vans': 5,\n",
       "                               'requirements': 9,\n",
       "                               'automobiles': 3,\n",
       "                               'roofs': 2,\n",
       "                               'minivans': 5,\n",
       "                               'belts': 6,\n",
       "                               'headrests': 1,\n",
       "                               'communications': 1,\n",
       "                               'crashes': 1,\n",
       "                               'fatalities': 2,\n",
       "                               'bags': 1,\n",
       "                               'pounds': 3,\n",
       "                               'inches': 1,\n",
       "                               'pickups': 1,\n",
       "                               'railcars': 3,\n",
       "                               'autos': 1,\n",
       "                               'offers': 3,\n",
       "                               'options': 11,\n",
       "                               'conversations': 2,\n",
       "                               'accessories': 4,\n",
       "                               'metals': 7,\n",
       "                               'shops': 3,\n",
       "                               'segments': 8,\n",
       "                               'superpremiums': 2,\n",
       "                               'classics': 2,\n",
       "                               'growths': 2,\n",
       "                               'Champagnes': 1,\n",
       "                               'wines': 14,\n",
       "                               'releases': 2,\n",
       "                               'bottles': 1,\n",
       "                               'vintages': 2,\n",
       "                               'cuvees': 1,\n",
       "                               'reds': 1,\n",
       "                               'tags': 1,\n",
       "                               'grapes': 2,\n",
       "                               'merchants': 3,\n",
       "                               'responses': 3,\n",
       "                               'retailers': 1,\n",
       "                               'opinions': 1,\n",
       "                               'six-packs': 2,\n",
       "                               'Producers': 2,\n",
       "                               'ideas': 3,\n",
       "                               'holidays': 1,\n",
       "                               'Signs': 1,\n",
       "                               'presidents': 4,\n",
       "                               'excesses': 1,\n",
       "                               'hotels': 1,\n",
       "                               'autions': 1,\n",
       "                               'capital-gains': 1,\n",
       "                               'bankers': 4,\n",
       "                               'Auctions': 1,\n",
       "                               'noodles': 1,\n",
       "                               'Investors': 3,\n",
       "                               'chemicals': 6,\n",
       "                               'alternatives': 6,\n",
       "                               'proposals': 2,\n",
       "                               'combinations': 1,\n",
       "                               'two-thirds': 2,\n",
       "                               'acquisitions': 10,\n",
       "                               'Officials': 3,\n",
       "                               'barriers': 3,\n",
       "                               'differences': 7,\n",
       "                               'journalists': 1,\n",
       "                               'emotions': 1,\n",
       "                               'Fears': 1,\n",
       "                               'moves': 5,\n",
       "                               'fires': 1,\n",
       "                               'troubles': 4,\n",
       "                               'structures': 3,\n",
       "                               'recommendations': 3,\n",
       "                               'concessions': 1,\n",
       "                               'specifics': 1,\n",
       "                               'sights': 1,\n",
       "                               'stones': 1,\n",
       "                               'lesions': 1,\n",
       "                               'corporations': 6,\n",
       "                               'deals': 6,\n",
       "                               'anxieties': 2,\n",
       "                               'Mitsubishi': 1,\n",
       "                               'combines': 1,\n",
       "                               'commodities': 4,\n",
       "                               'ships': 7,\n",
       "                               'houses': 7,\n",
       "                               'ventures': 2,\n",
       "                               'objectives': 2,\n",
       "                               'airlines': 2,\n",
       "                               'airports': 1,\n",
       "                               'duties': 8,\n",
       "                               'deposits': 4,\n",
       "                               'packages': 7,\n",
       "                               'adults': 1,\n",
       "                               'sub-segments': 1,\n",
       "                               'styles': 1,\n",
       "                               'sub-markets': 1,\n",
       "                               'branches': 3,\n",
       "                               'games': 2,\n",
       "                               'Banks': 2,\n",
       "                               'travelers': 1,\n",
       "                               'checks': 2,\n",
       "                               'copycats': 1,\n",
       "                               'margins': 7,\n",
       "                               'niches': 1,\n",
       "                               'ways': 9,\n",
       "                               'CDs': 1,\n",
       "                               'certificates': 1,\n",
       "                               'battles': 1,\n",
       "                               'unions': 2,\n",
       "                               'Packages': 1,\n",
       "                               'borrowers': 1,\n",
       "                               'savers\\\\/investors': 1,\n",
       "                               'drawbacks': 1,\n",
       "                               'personnel': 1,\n",
       "                               'needs': 2,\n",
       "                               'IRAs': 1,\n",
       "                               'doors': 1,\n",
       "                               'semesters': 1,\n",
       "                               'slides': 1,\n",
       "                               'halts': 3,\n",
       "                               'emergencies': 1,\n",
       "                               'futures': 63,\n",
       "                               'trades': 19,\n",
       "                               'industrials': 3,\n",
       "                               'sell-offs': 1,\n",
       "                               'minutes': 4,\n",
       "                               'aides': 2,\n",
       "                               'congressmen': 2,\n",
       "                               'legislators': 1,\n",
       "                               'breakers': 1,\n",
       "                               'viewpoints': 1,\n",
       "                               'sources': 8,\n",
       "                               'committees': 1,\n",
       "                               'English': 1,\n",
       "                               'peculiarities': 1,\n",
       "                               'bells': 19,\n",
       "                               'parishioners': 1,\n",
       "                               'ropes': 4,\n",
       "                               'church-goers': 1,\n",
       "                               'churches': 4,\n",
       "                               'ringers': 21,\n",
       "                               'octogenarians': 1,\n",
       "                               'youngsters': 2,\n",
       "                               'belfries': 1,\n",
       "                               'discos': 1,\n",
       "                               'dances': 1,\n",
       "                               'ranks': 2,\n",
       "                               'Sundays': 1,\n",
       "                               'tunes': 1,\n",
       "                               'carillons': 1,\n",
       "                               'foreigners': 1,\n",
       "                               'rounds': 1,\n",
       "                               'Ringers': 2,\n",
       "                               'methods': 3,\n",
       "                               'pulls': 1,\n",
       "                               'wheels': 1,\n",
       "                               'wrists': 1,\n",
       "                               'clerics': 1,\n",
       "                               'vicars': 2,\n",
       "                               'stairs': 1,\n",
       "                               'feelings': 1,\n",
       "                               'hopes': 3,\n",
       "                               'colleges': 1,\n",
       "                               'joys': 1,\n",
       "                               'bellringers': 1,\n",
       "                               'parishes': 1,\n",
       "                               'peals': 2,\n",
       "                               'replies': 1,\n",
       "                               'payouts': 3,\n",
       "                               'spiders': 1,\n",
       "                               'males': 1,\n",
       "                               'environments': 2,\n",
       "                               'peaks': 2,\n",
       "                               'watchers': 3,\n",
       "                               'Payouts': 1,\n",
       "                               'estimates': 6,\n",
       "                               'trends': 2,\n",
       "                               'advances': 2,\n",
       "                               'exits': 1,\n",
       "                               'Stockholders': 1,\n",
       "                               'slowdowns': 1,\n",
       "                               'bulls': 1,\n",
       "                               'expenditures': 1,\n",
       "                               'quarters': 4,\n",
       "                               'strains': 2,\n",
       "                               'demonstrators': 2,\n",
       "                               'platitudes': 1,\n",
       "                               'killings': 1,\n",
       "                               'demonstrations': 1,\n",
       "                               'exchanges': 3,\n",
       "                               'Relations': 1,\n",
       "                               'contacts': 2,\n",
       "                               'Ideas': 1,\n",
       "                               'borders': 1,\n",
       "                               'guards': 5,\n",
       "                               'guns': 1,\n",
       "                               'blocks': 1,\n",
       "                               'arms': 3,\n",
       "                               'pistols': 1,\n",
       "                               'plainclothes': 1,\n",
       "                               'police': 3,\n",
       "                               'soldiers': 1,\n",
       "                               'protests': 3,\n",
       "                               'rifles': 2,\n",
       "                               'diplomats': 1,\n",
       "                               'Firms': 1,\n",
       "                               'Graduates': 1,\n",
       "                               'images': 1,\n",
       "                               'perceptions': 1,\n",
       "                               'salaries': 1,\n",
       "                               'vacations': 2,\n",
       "                               'Ratings': 1,\n",
       "                               'negatives': 1,\n",
       "                               'liberals': 1,\n",
       "                               'professionals': 4,\n",
       "                               'voters': 5,\n",
       "                               'three-quarters': 1,\n",
       "                               'suspensions': 2,\n",
       "                               'principals': 2,\n",
       "                               'requests': 1,\n",
       "                               'agents': 4,\n",
       "                               'reps': 1,\n",
       "                               'mistakes': 1,\n",
       "                               'hurdles': 1,\n",
       "                               'mechanisms': 1,\n",
       "                               'operators': 2,\n",
       "                               'strategies': 3,\n",
       "                               'attractions': 2,\n",
       "                               'tapes': 1,\n",
       "                               'index-options': 1,\n",
       "                               'derivatives': 1,\n",
       "                               'proponents': 2,\n",
       "                               'Advocates': 1,\n",
       "                               'opponents': 3,\n",
       "                               'smiles': 1,\n",
       "                               'administrations': 1,\n",
       "                               'skills': 1,\n",
       "                               'entrants': 1,\n",
       "                               'Employers': 1,\n",
       "                               'employers': 1,\n",
       "                               'microcomputers': 1,\n",
       "                               'observers': 4,\n",
       "                               'insiders': 2,\n",
       "                               'Associates': 1,\n",
       "                               'universities': 1,\n",
       "                               'protesters': 2,\n",
       "                               'classmates': 1,\n",
       "                               'building-products': 1,\n",
       "                               'covers': 2,\n",
       "                               'cycles': 1,\n",
       "                               'reins': 1,\n",
       "                               'forest-products': 2,\n",
       "                               'waters': 3,\n",
       "                               'portions': 2,\n",
       "                               'guarantees': 5,\n",
       "                               'appropriators': 2,\n",
       "                               'initiatives': 4,\n",
       "                               'appropriations': 25,\n",
       "                               'amendments': 2,\n",
       "                               'tons': 10,\n",
       "                               'growers': 1,\n",
       "                               'allies': 1,\n",
       "                               'flights': 2,\n",
       "                               'departments': 1,\n",
       "                               'bridges': 3,\n",
       "                               'railings': 4,\n",
       "                               'openings': 2,\n",
       "                               'medallions': 1,\n",
       "                               'Compromises': 1,\n",
       "                               'Citizens': 1,\n",
       "                               'Cartons': 1,\n",
       "                               'POTABLES': 1,\n",
       "                               'trays': 2,\n",
       "                               'outlets': 2,\n",
       "                               'loops': 2,\n",
       "                               'cups': 1,\n",
       "                               'Lids': 1,\n",
       "                               'carriers': 1,\n",
       "                               'designers': 3,\n",
       "                               'chairs': 1,\n",
       "                               'corkscrews': 1,\n",
       "                               'BIRDS': 1,\n",
       "                               'architects': 1,\n",
       "                               'prisoners': 1,\n",
       "                               'solutions': 1,\n",
       "                               'walls': 1,\n",
       "                               'cells': 1,\n",
       "                               'visits': 1,\n",
       "                               'reasons': 4,\n",
       "                               'pyramids': 2,\n",
       "                               'inmates': 1,\n",
       "                               'fines': 4,\n",
       "                               ...}),\n",
       "                     'PDT': FreqDist({'All': 1,\n",
       "                               'Such': 2,\n",
       "                               'all': 14,\n",
       "                               'both': 1,\n",
       "                               'half': 4,\n",
       "                               'such': 5}),\n",
       "                     'POS': FreqDist({\"'\": 63, \"'s\": 761}),\n",
       "                     'PRP': FreqDist({'He': 73,\n",
       "                               'I': 113,\n",
       "                               'IT': 1,\n",
       "                               'It': 100,\n",
       "                               'She': 21,\n",
       "                               'They': 53,\n",
       "                               'We': 47,\n",
       "                               'You': 24,\n",
       "                               'he': 230,\n",
       "                               'her': 18,\n",
       "                               'herself': 1,\n",
       "                               'him': 16,\n",
       "                               'himself': 9,\n",
       "                               'it': 476,\n",
       "                               'itself': 7,\n",
       "                               'me': 9,\n",
       "                               'one': 2,\n",
       "                               'she': 77,\n",
       "                               'them': 70,\n",
       "                               'themselves': 12,\n",
       "                               'they': 210,\n",
       "                               'us': 26,\n",
       "                               'we': 48,\n",
       "                               'you': 70,\n",
       "                               'yourself': 3}),\n",
       "                     'PRP$': FreqDist({'Her': 4,\n",
       "                               'His': 5,\n",
       "                               'Its': 11,\n",
       "                               'My': 2,\n",
       "                               'Their': 3,\n",
       "                               'Your': 7,\n",
       "                               'her': 33,\n",
       "                               'his': 121,\n",
       "                               'its': 332,\n",
       "                               'my': 18,\n",
       "                               'our': 26,\n",
       "                               'their': 181,\n",
       "                               'your': 23}),\n",
       "                     'RB': FreqDist({'Academically': 1,\n",
       "                               'Actually': 1,\n",
       "                               'After': 1,\n",
       "                               'Again': 1,\n",
       "                               'Almost': 1,\n",
       "                               'Already': 1,\n",
       "                               'Also': 16,\n",
       "                               'Altogether': 1,\n",
       "                               'Always': 1,\n",
       "                               'As': 1,\n",
       "                               'Back': 1,\n",
       "                               'Certainly': 1,\n",
       "                               'Currently': 4,\n",
       "                               'Elsewhere': 2,\n",
       "                               'Even': 8,\n",
       "                               'Far': 1,\n",
       "                               'Financially': 1,\n",
       "                               'Frankly': 1,\n",
       "                               'Further': 2,\n",
       "                               'Generally': 1,\n",
       "                               'Here': 3,\n",
       "                               'However': 11,\n",
       "                               'Indeed': 6,\n",
       "                               'Instead': 5,\n",
       "                               'Invariably': 1,\n",
       "                               'Just': 4,\n",
       "                               'LATE': 1,\n",
       "                               'Late': 2,\n",
       "                               'Little': 1,\n",
       "                               'Maybe': 2,\n",
       "                               'Meanwhile': 9,\n",
       "                               'Moreover': 8,\n",
       "                               'Mostly': 1,\n",
       "                               'Much': 2,\n",
       "                               'Nevertheless': 2,\n",
       "                               'No': 1,\n",
       "                               'Nonetheless': 1,\n",
       "                               'Not': 7,\n",
       "                               'Now': 9,\n",
       "                               'Often': 1,\n",
       "                               'Once': 3,\n",
       "                               'Only': 5,\n",
       "                               'Otherwise': 1,\n",
       "                               'Particularly': 1,\n",
       "                               'Partly': 3,\n",
       "                               'Perhaps': 2,\n",
       "                               'Possibly': 1,\n",
       "                               'Previously': 4,\n",
       "                               'Prior': 1,\n",
       "                               'Probably': 1,\n",
       "                               'Rather': 2,\n",
       "                               'Recently': 1,\n",
       "                               'Right': 2,\n",
       "                               'Separately': 3,\n",
       "                               'Shortly': 1,\n",
       "                               'Similarly': 3,\n",
       "                               'So': 11,\n",
       "                               'Some': 2,\n",
       "                               'Sometimes': 2,\n",
       "                               'Soon': 2,\n",
       "                               'Still': 8,\n",
       "                               'Sure': 1,\n",
       "                               'Then': 7,\n",
       "                               'Thus': 3,\n",
       "                               'Too': 2,\n",
       "                               'Totally': 1,\n",
       "                               'Traditionally': 1,\n",
       "                               'Typically': 2,\n",
       "                               'Unfortunately': 1,\n",
       "                               'Virtually': 1,\n",
       "                               'Yet': 3,\n",
       "                               'about': 27,\n",
       "                               'above': 2,\n",
       "                               'abroad': 3,\n",
       "                               'absolutely': 2,\n",
       "                               'accidentally': 1,\n",
       "                               'accurately': 1,\n",
       "                               'actively': 2,\n",
       "                               'actually': 3,\n",
       "                               'adequately': 1,\n",
       "                               'after': 1,\n",
       "                               'afterwards': 1,\n",
       "                               'again': 14,\n",
       "                               'aggressively': 2,\n",
       "                               'ago': 16,\n",
       "                               'ahead': 9,\n",
       "                               'alike': 1,\n",
       "                               'all': 3,\n",
       "                               'allegedly': 3,\n",
       "                               'almost': 22,\n",
       "                               'alone': 6,\n",
       "                               'already': 35,\n",
       "                               'also': 147,\n",
       "                               'alternatively': 1,\n",
       "                               'altogether': 1,\n",
       "                               'always': 15,\n",
       "                               'amazingly': 1,\n",
       "                               'annually': 4,\n",
       "                               'any': 2,\n",
       "                               'anytime': 2,\n",
       "                               'anyway': 1,\n",
       "                               'anywhere': 1,\n",
       "                               'apart': 1,\n",
       "                               'apiece': 2,\n",
       "                               'apparently': 14,\n",
       "                               'approximately': 2,\n",
       "                               'around': 3,\n",
       "                               'as': 52,\n",
       "                               'away': 13,\n",
       "                               'awfully': 1,\n",
       "                               'back': 15,\n",
       "                               'badly': 3,\n",
       "                               'barely': 1,\n",
       "                               'basically': 5,\n",
       "                               'because': 2,\n",
       "                               'before': 6,\n",
       "                               'beforehand': 1,\n",
       "                               'below': 1,\n",
       "                               'brilliantly': 1,\n",
       "                               'broadly': 1,\n",
       "                               'but': 1,\n",
       "                               'by': 1,\n",
       "                               'carefully': 1,\n",
       "                               'cautiously': 1,\n",
       "                               'certainly': 4,\n",
       "                               'chiefly': 1,\n",
       "                               'clear': 1,\n",
       "                               'clearly': 6,\n",
       "                               'close': 2,\n",
       "                               'closely': 15,\n",
       "                               'comfortably': 1,\n",
       "                               'completely': 2,\n",
       "                               'considerably': 4,\n",
       "                               'consistently': 2,\n",
       "                               'constantly': 3,\n",
       "                               'continually': 3,\n",
       "                               'continuingly': 1,\n",
       "                               'continuously': 1,\n",
       "                               'currently': 22,\n",
       "                               'damn': 2,\n",
       "                               'darned': 1,\n",
       "                               'deeply': 1,\n",
       "                               'definitely': 1,\n",
       "                               'deliberately': 1,\n",
       "                               'derisively': 1,\n",
       "                               'desperately': 1,\n",
       "                               'differently': 1,\n",
       "                               'directly': 6,\n",
       "                               'domestically': 1,\n",
       "                               'down': 22,\n",
       "                               'downright': 1,\n",
       "                               'downward': 1,\n",
       "                               'dramatically': 2,\n",
       "                               'drastically': 1,\n",
       "                               'due': 1,\n",
       "                               'duly': 2,\n",
       "                               'earlier': 3,\n",
       "                               'early': 14,\n",
       "                               'easily': 6,\n",
       "                               'editorially': 2,\n",
       "                               'effectively': 4,\n",
       "                               'either': 2,\n",
       "                               'else': 3,\n",
       "                               'elsewhere': 3,\n",
       "                               'enormously': 1,\n",
       "                               'enough': 12,\n",
       "                               'entirely': 4,\n",
       "                               'equally': 4,\n",
       "                               'especially': 9,\n",
       "                               'essentially': 8,\n",
       "                               'even': 64,\n",
       "                               'evenly': 2,\n",
       "                               'eventually': 8,\n",
       "                               'ever': 9,\n",
       "                               'everywhere': 2,\n",
       "                               'exactly': 1,\n",
       "                               'exceedingly': 1,\n",
       "                               'exceptionally': 2,\n",
       "                               'excessively': 1,\n",
       "                               'exclusively': 1,\n",
       "                               'expressly': 1,\n",
       "                               'extremely': 4,\n",
       "                               'fairly': 5,\n",
       "                               'far': 28,\n",
       "                               'fast': 2,\n",
       "                               'faultlessly': 1,\n",
       "                               'favorably': 1,\n",
       "                               'federally': 1,\n",
       "                               'finally': 4,\n",
       "                               'financially': 3,\n",
       "                               'fine': 1,\n",
       "                               'firmly': 1,\n",
       "                               'first': 9,\n",
       "                               'flat': 1,\n",
       "                               'for': 1,\n",
       "                               'formally': 2,\n",
       "                               'formerly': 3,\n",
       "                               'forward': 4,\n",
       "                               'fractionally': 2,\n",
       "                               'frankly': 1,\n",
       "                               'free': 1,\n",
       "                               'frequently': 5,\n",
       "                               'fully': 12,\n",
       "                               'fundamentally': 1,\n",
       "                               'further': 4,\n",
       "                               'generally': 13,\n",
       "                               'globally': 1,\n",
       "                               'gradually': 1,\n",
       "                               'greatly': 3,\n",
       "                               'hard': 5,\n",
       "                               'hardly': 4,\n",
       "                               'harshly': 2,\n",
       "                               'heavily': 7,\n",
       "                               'here': 20,\n",
       "                               'high': 2,\n",
       "                               'highly': 12,\n",
       "                               'historically': 3,\n",
       "                               'hither': 1,\n",
       "                               'home': 1,\n",
       "                               'honorably': 1,\n",
       "                               'hopefully': 3,\n",
       "                               'however': 24,\n",
       "                               'hydraulically': 1,\n",
       "                               'illegally': 2,\n",
       "                               'immediately': 3,\n",
       "                               'implicitly': 1,\n",
       "                               'in': 2,\n",
       "                               'inaccurately': 1,\n",
       "                               'increasingly': 4,\n",
       "                               'indeed': 3,\n",
       "                               'indefinitely': 2,\n",
       "                               'informally': 1,\n",
       "                               'inherently': 1,\n",
       "                               'initially': 5,\n",
       "                               'instead': 8,\n",
       "                               'intimately': 1,\n",
       "                               'invariably': 1,\n",
       "                               'jointly': 8,\n",
       "                               'just': 44,\n",
       "                               'laboriously': 1,\n",
       "                               'largely': 12,\n",
       "                               'last': 1,\n",
       "                               'late': 2,\n",
       "                               'lately': 1,\n",
       "                               'likely': 2,\n",
       "                               'little': 9,\n",
       "                               'locally': 1,\n",
       "                               'long': 11,\n",
       "                               'longer': 1,\n",
       "                               'low': 1,\n",
       "                               'madly': 1,\n",
       "                               'mainly': 5,\n",
       "                               'manually': 2,\n",
       "                               'marginally': 2,\n",
       "                               'marvelously': 1,\n",
       "                               'maybe': 1,\n",
       "                               'meanwhile': 5,\n",
       "                               'mechanically': 1,\n",
       "                               'mentally': 2,\n",
       "                               'merely': 5,\n",
       "                               'mistakenly': 1,\n",
       "                               'moderately': 2,\n",
       "                               'modestly': 5,\n",
       "                               'monthly': 1,\n",
       "                               'moreover': 1,\n",
       "                               'mostly': 7,\n",
       "                               'much': 30,\n",
       "                               \"n't\": 325,\n",
       "                               'namely': 3,\n",
       "                               'narrowly': 1,\n",
       "                               'nearby': 1,\n",
       "                               'nearly': 17,\n",
       "                               'necessarily': 2,\n",
       "                               'never': 20,\n",
       "                               'newly': 3,\n",
       "                               'newsweekly': 1,\n",
       "                               'no': 10,\n",
       "                               'noncompetitively': 1,\n",
       "                               'nonetheless': 1,\n",
       "                               'normally': 4,\n",
       "                               'not': 133,\n",
       "                               'notably': 3,\n",
       "                               'now': 61,\n",
       "                               'nowhere': 2,\n",
       "                               'obviously': 2,\n",
       "                               'occasionally': 2,\n",
       "                               'off': 4,\n",
       "                               'officially': 7,\n",
       "                               'often': 24,\n",
       "                               'on': 1,\n",
       "                               'once': 13,\n",
       "                               'only': 68,\n",
       "                               'openly': 2,\n",
       "                               'originally': 3,\n",
       "                               'otherwise': 1,\n",
       "                               'out': 3,\n",
       "                               'over': 2,\n",
       "                               'overseas': 4,\n",
       "                               'p.m': 2,\n",
       "                               'partially': 3,\n",
       "                               'particularly': 17,\n",
       "                               'partly': 9,\n",
       "                               'perfectly': 2,\n",
       "                               'perhaps': 10,\n",
       "                               'personally': 1,\n",
       "                               'plus': 1,\n",
       "                               'politely': 1,\n",
       "                               'politically': 1,\n",
       "                               'poorly': 4,\n",
       "                               'popularly': 1,\n",
       "                               'possibly': 6,\n",
       "                               'potentially': 1,\n",
       "                               'precisely': 4,\n",
       "                               'predictably': 1,\n",
       "                               'presumably': 2,\n",
       "                               'pretty': 7,\n",
       "                               'previously': 10,\n",
       "                               'primarily': 6,\n",
       "                               'prior': 4,\n",
       "                               'privately': 6,\n",
       "                               'probably': 14,\n",
       "                               'profitably': 2,\n",
       "                               'prominently': 1,\n",
       "                               'promptly': 3,\n",
       "                               'properly': 1,\n",
       "                               'prospectively': 1,\n",
       "                               'publicly': 11,\n",
       "                               'purely': 1,\n",
       "                               'quarterly': 1,\n",
       "                               'quickly': 13,\n",
       "                               'quietly': 1,\n",
       "                               'quite': 4,\n",
       "                               'radically': 1,\n",
       "                               'rapidly': 6,\n",
       "                               'rarely': 1,\n",
       "                               'rather': 16,\n",
       "                               'real': 1,\n",
       "                               'really': 12,\n",
       "                               'reasonably': 1,\n",
       "                               'recently': 25,\n",
       "                               'regardless': 1,\n",
       "                               'relatively': 11,\n",
       "                               'relentlessly': 1,\n",
       "                               'repeatedly': 1,\n",
       "                               'reportedly': 1,\n",
       "                               'rhythmically': 1,\n",
       "                               'right': 7,\n",
       "                               'robustly': 1,\n",
       "                               'roughly': 9,\n",
       "                               'satisfactorily': 1,\n",
       "                               'scarcely': 1,\n",
       "                               'scrupulously': 1,\n",
       "                               'seasonally': 2,\n",
       "                               'separately': 1,\n",
       "                               'seriously': 3,\n",
       "                               'sharply': 11,\n",
       "                               'short': 2,\n",
       "                               'shortly': 4,\n",
       "                               'significantly': 6,\n",
       "                               'simply': 7,\n",
       "                               'simultaneously': 1,\n",
       "                               'single-handedly': 2,\n",
       "                               'skyward': 1,\n",
       "                               'slightly': 10,\n",
       "                               'slow': 1,\n",
       "                               'slowly': 4,\n",
       "                               'smartly': 1,\n",
       "                               'smoothly': 1,\n",
       "                               'so': 55,\n",
       "                               'solely': 1,\n",
       "                               'somehow': 1,\n",
       "                               'sometimes': 8,\n",
       "                               'somewhat': 2,\n",
       "                               'soon': 11,\n",
       "                               'sooner': 1,\n",
       "                               'south': 1,\n",
       "                               'spectacularly': 1,\n",
       "                               'staunchly': 1,\n",
       "                               'steadily': 1,\n",
       "                               'still': 36,\n",
       "                               'stocks': 1,\n",
       "                               'straight': 2,\n",
       "                               'strictly': 1,\n",
       "                               'stringently': 1,\n",
       "                               'strongly': 3,\n",
       "                               'structurally': 1,\n",
       "                               'studiously': 1,\n",
       "                               'substantially': 7,\n",
       "                               'successfully': 1,\n",
       "                               'suddenly': 2,\n",
       "                               'sufficiently': 1,\n",
       "                               'supposedly': 2,\n",
       "                               'sure': 1,\n",
       "                               'surely': 2,\n",
       "                               'surprisingly': 3,\n",
       "                               'surreptitiously': 1,\n",
       "                               'swiftly': 3,\n",
       "                               'technically': 1,\n",
       "                               'temporarily': 8,\n",
       "                               'tenfold': 1,\n",
       "                               'tentatively': 6,\n",
       "                               'that': 3,\n",
       "                               'then': 27,\n",
       "                               'there': 12,\n",
       "                               'therefore': 1,\n",
       "                               'though': 4,\n",
       "                               'thus': 4,\n",
       "                               'tidily': 1,\n",
       "                               'tight': 1,\n",
       "                               'together': 6,\n",
       "                               'too': 22,\n",
       "                               'traditionally': 2,\n",
       "                               'triple': 1,\n",
       "                               'twice': 1,\n",
       "                               'typically': 3,\n",
       "                               'ultimately': 2,\n",
       "                               'unbearably': 1,\n",
       "                               'unfairly': 4,\n",
       "                               'universally': 1,\n",
       "                               'unrealistically': 1,\n",
       "                               'unsuccessfully': 2,\n",
       "                               'unusually': 2,\n",
       "                               'up': 49,\n",
       "                               'upside': 1,\n",
       "                               'upstream': 1,\n",
       "                               'usually': 10,\n",
       "                               'utterly': 1,\n",
       "                               'vertically': 1,\n",
       "                               'very': 28,\n",
       "                               'vice': 1,\n",
       "                               'virtually': 6,\n",
       "                               'vitally': 1,\n",
       "                               'voluntarily': 2,\n",
       "                               'well': 46,\n",
       "                               'wide': 1,\n",
       "                               'widely': 10,\n",
       "                               'wildly': 1,\n",
       "                               'yes': 1,\n",
       "                               'yet': 14,\n",
       "                               'yon': 1}),\n",
       "                     'RBR': FreqDist({'Earlier': 1,\n",
       "                               'More': 2,\n",
       "                               'better': 9,\n",
       "                               'closer': 1,\n",
       "                               'drearier': 1,\n",
       "                               'earlier': 11,\n",
       "                               'further': 2,\n",
       "                               'harder': 1,\n",
       "                               'higher': 2,\n",
       "                               'later': 2,\n",
       "                               'less': 11,\n",
       "                               'longer': 4,\n",
       "                               'lower': 1,\n",
       "                               'more': 86,\n",
       "                               'never': 1,\n",
       "                               'sooner': 1}),\n",
       "                     'RBS': FreqDist({'Most': 2, 'most': 33}),\n",
       "                     'RP': FreqDist({'about': 3,\n",
       "                               'across': 1,\n",
       "                               'around': 3,\n",
       "                               'away': 4,\n",
       "                               'back': 6,\n",
       "                               'by': 1,\n",
       "                               'down': 14,\n",
       "                               'for': 1,\n",
       "                               'in': 15,\n",
       "                               'off': 27,\n",
       "                               'on': 6,\n",
       "                               'out': 47,\n",
       "                               'over': 7,\n",
       "                               'through': 1,\n",
       "                               'together': 3,\n",
       "                               'up': 77}),\n",
       "                     'SYM': FreqDist({'&': 1}),\n",
       "                     'TO': FreqDist({'TO': 1, 'To': 17, 'to': 2161}),\n",
       "                     'UH': FreqDist({'OK': 1, 'Oh': 1, 'no': 1}),\n",
       "                     'VB': FreqDist({'Buy': 3,\n",
       "                               \"C'mon\": 1,\n",
       "                               'Choose': 1,\n",
       "                               'Compare': 1,\n",
       "                               'Consider': 1,\n",
       "                               'Do': 1,\n",
       "                               'Eliminate': 1,\n",
       "                               'Forget': 1,\n",
       "                               'Hold': 1,\n",
       "                               'Kill': 1,\n",
       "                               'Make': 1,\n",
       "                               'Note': 1,\n",
       "                               'Pick': 1,\n",
       "                               'Put': 2,\n",
       "                               'Remember': 1,\n",
       "                               'Send': 1,\n",
       "                               'Sit': 1,\n",
       "                               'Take': 6,\n",
       "                               'Think': 2,\n",
       "                               'abandon': 2,\n",
       "                               'abide': 1,\n",
       "                               'accept': 2,\n",
       "                               'accommodate': 3,\n",
       "                               'accompany': 1,\n",
       "                               'account': 1,\n",
       "                               'accrue': 1,\n",
       "                               'achieve': 2,\n",
       "                               'acknowledge': 1,\n",
       "                               'acquire': 10,\n",
       "                               'act': 6,\n",
       "                               'add': 5,\n",
       "                               'address': 2,\n",
       "                               'administer': 1,\n",
       "                               'adopt': 1,\n",
       "                               'advance': 1,\n",
       "                               'advertise': 3,\n",
       "                               'affect': 1,\n",
       "                               'afford': 1,\n",
       "                               'agree': 1,\n",
       "                               'aid': 1,\n",
       "                               'aim': 1,\n",
       "                               'alleviate': 1,\n",
       "                               'allow': 5,\n",
       "                               'amend': 1,\n",
       "                               'analyze': 1,\n",
       "                               'announce': 2,\n",
       "                               'answer': 2,\n",
       "                               'apologize': 1,\n",
       "                               'appeal': 1,\n",
       "                               'appear': 1,\n",
       "                               'appease': 1,\n",
       "                               'apply': 4,\n",
       "                               'appoint': 1,\n",
       "                               'approve': 5,\n",
       "                               'argue': 1,\n",
       "                               'arrest': 1,\n",
       "                               'arrive': 1,\n",
       "                               'ask': 3,\n",
       "                               'assemble': 1,\n",
       "                               'assert': 1,\n",
       "                               'assess': 1,\n",
       "                               'assist': 1,\n",
       "                               'assume': 2,\n",
       "                               'assure': 1,\n",
       "                               'attack': 1,\n",
       "                               'attempt': 2,\n",
       "                               'attend': 3,\n",
       "                               'attract': 4,\n",
       "                               'audit': 1,\n",
       "                               'augment': 1,\n",
       "                               'avenge': 1,\n",
       "                               'avert': 1,\n",
       "                               'avoid': 6,\n",
       "                               'back': 1,\n",
       "                               'ban': 2,\n",
       "                               'bar': 1,\n",
       "                               'be': 356,\n",
       "                               'beat': 4,\n",
       "                               'become': 15,\n",
       "                               'beg': 1,\n",
       "                               'begin': 9,\n",
       "                               'believe': 3,\n",
       "                               'belong': 1,\n",
       "                               'bend': 1,\n",
       "                               'benefit': 2,\n",
       "                               'bless': 1,\n",
       "                               'blip': 1,\n",
       "                               'block': 6,\n",
       "                               'bludgeon': 1,\n",
       "                               'boast': 1,\n",
       "                               'bolster': 1,\n",
       "                               'book': 1,\n",
       "                               'boost': 8,\n",
       "                               'bounce': 1,\n",
       "                               'breach': 2,\n",
       "                               'break': 3,\n",
       "                               'breathe': 1,\n",
       "                               'brief': 1,\n",
       "                               'bring': 9,\n",
       "                               'broaden': 1,\n",
       "                               'buffet': 1,\n",
       "                               'build': 9,\n",
       "                               'buy': 47,\n",
       "                               'calculate': 1,\n",
       "                               'call': 1,\n",
       "                               'capitalize': 1,\n",
       "                               'capture': 4,\n",
       "                               'care': 4,\n",
       "                               'carry': 8,\n",
       "                               'catch': 1,\n",
       "                               'cause': 5,\n",
       "                               'celebrate': 1,\n",
       "                               'challenge': 1,\n",
       "                               'change': 6,\n",
       "                               'charge': 3,\n",
       "                               'chase': 1,\n",
       "                               'chat': 1,\n",
       "                               'cheat': 1,\n",
       "                               'check': 3,\n",
       "                               'choose': 4,\n",
       "                               'cite': 1,\n",
       "                               'claim': 2,\n",
       "                               'clarify': 2,\n",
       "                               'clean': 1,\n",
       "                               'clear': 3,\n",
       "                               'climb': 1,\n",
       "                               'close': 9,\n",
       "                               'color': 1,\n",
       "                               'combat': 1,\n",
       "                               'combine': 1,\n",
       "                               'come': 13,\n",
       "                               'command': 1,\n",
       "                               'comment': 8,\n",
       "                               'commit': 1,\n",
       "                               'compel': 1,\n",
       "                               'compensate': 2,\n",
       "                               'compete': 3,\n",
       "                               'complete': 6,\n",
       "                               'complicate': 1,\n",
       "                               'compromise': 2,\n",
       "                               'computerize': 1,\n",
       "                               'concentrate': 2,\n",
       "                               'concern': 1,\n",
       "                               'conclude': 2,\n",
       "                               'conduct': 1,\n",
       "                               'confirm': 2,\n",
       "                               'confuse': 1,\n",
       "                               'consider': 6,\n",
       "                               'consist': 1,\n",
       "                               'contain': 3,\n",
       "                               'contest': 1,\n",
       "                               'continue': 13,\n",
       "                               'contract': 1,\n",
       "                               'contradict': 2,\n",
       "                               'contribute': 2,\n",
       "                               'control': 1,\n",
       "                               'convert': 1,\n",
       "                               'convince': 1,\n",
       "                               'coordinate': 1,\n",
       "                               'cope': 2,\n",
       "                               'copy': 2,\n",
       "                               'correct': 1,\n",
       "                               'cost': 4,\n",
       "                               'counteract': 1,\n",
       "                               'cover': 5,\n",
       "                               'crack': 1,\n",
       "                               'craft': 1,\n",
       "                               'create': 6,\n",
       "                               'curb': 3,\n",
       "                               'cure': 1,\n",
       "                               'curtail': 2,\n",
       "                               'cut': 12,\n",
       "                               'deal': 1,\n",
       "                               'debate': 1,\n",
       "                               'decide': 4,\n",
       "                               'declare': 1,\n",
       "                               'decline': 4,\n",
       "                               'decrease': 1,\n",
       "                               'default': 1,\n",
       "                               'defeat': 1,\n",
       "                               'define': 2,\n",
       "                               'defuse': 1,\n",
       "                               'delay': 1,\n",
       "                               'delete': 1,\n",
       "                               'deliver': 2,\n",
       "                               'demand': 1,\n",
       "                               'demobilize': 1,\n",
       "                               'denounce': 1,\n",
       "                               'deny': 2,\n",
       "                               'depend': 1,\n",
       "                               'describe': 1,\n",
       "                               'deserve': 1,\n",
       "                               'design': 2,\n",
       "                               'despise': 1,\n",
       "                               'destroy': 1,\n",
       "                               'deter': 1,\n",
       "                               'determine': 3,\n",
       "                               'develop': 3,\n",
       "                               'devise': 1,\n",
       "                               'devote': 2,\n",
       "                               'die': 4,\n",
       "                               'diminish': 1,\n",
       "                               'direct': 3,\n",
       "                               'disappear': 1,\n",
       "                               'discharge': 2,\n",
       "                               'disclose': 1,\n",
       "                               'disconnect': 1,\n",
       "                               'discontinue': 1,\n",
       "                               'discourage': 1,\n",
       "                               'discredit': 1,\n",
       "                               'discuss': 5,\n",
       "                               'disgorge': 6,\n",
       "                               'display': 1,\n",
       "                               'disseminate': 1,\n",
       "                               'diversify': 2,\n",
       "                               'divest': 1,\n",
       "                               'do': 34,\n",
       "                               'double': 1,\n",
       "                               'draw': 2,\n",
       "                               'drop': 4,\n",
       "                               'duck': 1,\n",
       "                               'earn': 2,\n",
       "                               'ease': 6,\n",
       "                               'eclipse': 1,\n",
       "                               'elaborate': 7,\n",
       "                               'eliminate': 5,\n",
       "                               'emasculate': 1,\n",
       "                               'emerge': 1,\n",
       "                               'emigrate': 1,\n",
       "                               'enable': 1,\n",
       "                               'enact': 1,\n",
       "                               'encounter': 1,\n",
       "                               'encourage': 2,\n",
       "                               'end': 7,\n",
       "                               'endorse': 1,\n",
       "                               'enforce': 2,\n",
       "                               'engage': 1,\n",
       "                               'ensure': 1,\n",
       "                               'enter': 1,\n",
       "                               'entertain': 1,\n",
       "                               'entice': 1,\n",
       "                               'entrench': 1,\n",
       "                               'equip': 1,\n",
       "                               'erect': 1,\n",
       "                               'erode': 1,\n",
       "                               'establish': 2,\n",
       "                               'estimate': 1,\n",
       "                               'even': 1,\n",
       "                               'evolve': 1,\n",
       "                               'exceed': 3,\n",
       "                               'exchange': 2,\n",
       "                               'excise': 1,\n",
       "                               'execute': 4,\n",
       "                               'exercise': 5,\n",
       "                               'exist': 1,\n",
       "                               'expand': 5,\n",
       "                               'expect': 2,\n",
       "                               'experience': 1,\n",
       "                               'expire': 4,\n",
       "                               'explain': 2,\n",
       "                               'exploit': 1,\n",
       "                               'explore': 1,\n",
       "                               'export': 2,\n",
       "                               'extend': 7,\n",
       "                               'fabricate': 1,\n",
       "                               'face': 10,\n",
       "                               'facilitate': 1,\n",
       "                               'fail': 1,\n",
       "                               'faint': 1,\n",
       "                               'fall': 6,\n",
       "                               'falsify': 1,\n",
       "                               'favor': 1,\n",
       "                               'feel': 3,\n",
       "                               'fend': 1,\n",
       "                               'figure': 2,\n",
       "                               'file': 6,\n",
       "                               'fill': 2,\n",
       "                               'finance': 5,\n",
       "                               'find': 11,\n",
       "                               'flourish': 1,\n",
       "                               'fly': 1,\n",
       "                               'focus': 4,\n",
       "                               'fold': 2,\n",
       "                               'follow': 2,\n",
       "                               'force': 6,\n",
       "                               'form': 1,\n",
       "                               'free': 1,\n",
       "                               'fuel': 1,\n",
       "                               'fund': 2,\n",
       "                               'gain': 4,\n",
       "                               'gather': 1,\n",
       "                               'gauge': 2,\n",
       "                               'generate': 1,\n",
       "                               'get': 40,\n",
       "                               'give': 15,\n",
       "                               'glamorize': 1,\n",
       "                               'go': 18,\n",
       "                               'grant': 3,\n",
       "                               'grapple': 1,\n",
       "                               'guarantee': 1,\n",
       "                               'gyrate': 1,\n",
       "                               'halt': 1,\n",
       "                               'halve': 1,\n",
       "                               'handle': 2,\n",
       "                               'hang': 1,\n",
       "                               'happen': 5,\n",
       "                               'harass': 2,\n",
       "                               'have': 101,\n",
       "                               'head': 1,\n",
       "                               'hear': 4,\n",
       "                               'help': 37,\n",
       "                               'herald': 1,\n",
       "                               'highlight': 1,\n",
       "                               'hire': 2,\n",
       "                               'hit': 2,\n",
       "                               'hold': 4,\n",
       "                               'honor': 3,\n",
       "                               'hope': 1,\n",
       "                               'house': 2,\n",
       "                               'hunker': 1,\n",
       "                               'hurt': 3,\n",
       "                               'identify': 2,\n",
       "                               'imagine': 1,\n",
       "                               'impart': 1,\n",
       "                               'impede': 1,\n",
       "                               'implant': 1,\n",
       "                               'implement': 2,\n",
       "                               'impose': 3,\n",
       "                               'improve': 11,\n",
       "                               'include': 3,\n",
       "                               'increase': 11,\n",
       "                               'indicate': 2,\n",
       "                               'induce': 1,\n",
       "                               'inform': 1,\n",
       "                               'inhibit': 1,\n",
       "                               'insert': 1,\n",
       "                               'install': 2,\n",
       "                               'institute': 1,\n",
       "                               'intend': 1,\n",
       "                               'intimidate': 1,\n",
       "                               'introduce': 7,\n",
       "                               'invent': 1,\n",
       "                               'investigate': 1,\n",
       "                               'invite': 1,\n",
       "                               'involve': 3,\n",
       "                               'issue': 6,\n",
       "                               'join': 4,\n",
       "                               'juggle': 1,\n",
       "                               'jump': 3,\n",
       "                               'junk': 1,\n",
       "                               'justify': 2,\n",
       "                               'keep': 15,\n",
       "                               'kill': 1,\n",
       "                               'know': 10,\n",
       "                               'land': 1,\n",
       "                               'last': 2,\n",
       "                               'launch': 2,\n",
       "                               'lead': 8,\n",
       "                               'learn': 1,\n",
       "                               'lease': 1,\n",
       "                               'leave': 6,\n",
       "                               'lessen': 1,\n",
       "                               'let': 6,\n",
       "                               'license': 1,\n",
       "                               'lift': 4,\n",
       "                               'like': 8,\n",
       "                               'limit': 4,\n",
       "                               'link': 2,\n",
       "                               'live': 2,\n",
       "                               'load': 2,\n",
       "                               'lock': 1,\n",
       "                               'log': 1,\n",
       "                               'look': 4,\n",
       "                               'lose': 2,\n",
       "                               'lure': 2,\n",
       "                               'maintain': 2,\n",
       "                               'make': 63,\n",
       "                               'manipulate': 1,\n",
       "                               'manufacture': 2,\n",
       "                               'map': 1,\n",
       "                               'match': 2,\n",
       "                               'matter': 1,\n",
       "                               'mature': 4,\n",
       "                               'maximize': 2,\n",
       "                               'mean': 3,\n",
       "                               'measure': 1,\n",
       "                               'meet': 9,\n",
       "                               'mend': 1,\n",
       "                               'mention': 2,\n",
       "                               'merge': 2,\n",
       "                               'merit': 1,\n",
       "                               'migrate': 1,\n",
       "                               'mind': 1,\n",
       "                               'mitigate': 1,\n",
       "                               'modify': 2,\n",
       "                               'monopolize': 1,\n",
       "                               'mount': 1,\n",
       "                               'move': 8,\n",
       "                               'name': 1,\n",
       "                               'need': 1,\n",
       "                               'negotiate': 4,\n",
       "                               'nominate': 2,\n",
       "                               'note': 1,\n",
       "                               'notify': 1,\n",
       "                               'obtain': 3,\n",
       "                               'occur': 5,\n",
       "                               'offend': 1,\n",
       "                               'offer': 6,\n",
       "                               'offset': 4,\n",
       "                               'open': 2,\n",
       "                               'operate': 6,\n",
       "                               'oppose': 1,\n",
       "                               'oust': 1,\n",
       "                               'outbid': 1,\n",
       "                               'overcome': 1,\n",
       "                               'overlap': 1,\n",
       "                               'override': 1,\n",
       "                               'oversee': 1,\n",
       "                               'own': 6,\n",
       "                               'pair': 1,\n",
       "                               'panic': 1,\n",
       "                               'parallel': 1,\n",
       "                               'participate': 2,\n",
       "                               'pass': 4,\n",
       "                               'pay': 28,\n",
       "                               'penetrate': 1,\n",
       "                               'perform': 3,\n",
       "                               'permit': 2,\n",
       "                               'persuade': 2,\n",
       "                               'phase': 1,\n",
       "                               'photocopy': 1,\n",
       "                               'pick': 2,\n",
       "                               'place': 1,\n",
       "                               'plan': 1,\n",
       "                               'play': 3,\n",
       "                               'please': 1,\n",
       "                               'point': 1,\n",
       "                               'polish': 1,\n",
       "                               'pose': 2,\n",
       "                               'position': 1,\n",
       "                               'post': 2,\n",
       "                               'pour': 1,\n",
       "                               'preclude': 1,\n",
       "                               'predict': 1,\n",
       "                               'predispose': 1,\n",
       "                               'prepare': 1,\n",
       "                               'prescribe': 1,\n",
       "                               'present': 1,\n",
       "                               'pressure': 2,\n",
       "                               'prevent': 10,\n",
       "                               'print': 6,\n",
       "                               'produce': 8,\n",
       "                               'profit': 3,\n",
       "                               'project': 1,\n",
       "                               'promote': 2,\n",
       "                               'propagandize': 1,\n",
       "                               'prosecute': 1,\n",
       "                               'protect': 3,\n",
       "                               'prove': 8,\n",
       "                               'provide': 12,\n",
       "                               'provoke': 2,\n",
       "                               'publish': 2,\n",
       "                               'pull': 1,\n",
       "                               'punish': 1,\n",
       "                               'purchase': 2,\n",
       "                               'pursue': 5,\n",
       "                               'push': 3,\n",
       "                               'put': 10,\n",
       "                               'qualify': 2,\n",
       "                               'question': 1,\n",
       "                               'quote': 1,\n",
       "                               'raise': 17,\n",
       "                               'range': 1,\n",
       "                               'rate': 1,\n",
       "                               'reach': 2,\n",
       "                               'read': 6,\n",
       "                               'realestate': 1,\n",
       "                               'realize': 4,\n",
       "                               'reallocate': 1,\n",
       "                               'reap': 1,\n",
       "                               'rebound': 1,\n",
       "                               'rebuild': 1,\n",
       "                               'recall': 1,\n",
       "                               'receive': 12,\n",
       "                               'reclaim': 1,\n",
       "                               'recognize': 2,\n",
       "                               'recommend': 2,\n",
       "                               'record': 3,\n",
       "                               'recover': 2,\n",
       "                               'recruit': 1,\n",
       "                               'red-flag': 1,\n",
       "                               'redeem': 2,\n",
       "                               'redeploy': 1,\n",
       "                               'redistribute': 1,\n",
       "                               'reduce': 13,\n",
       "                               'refile': 1,\n",
       "                               'reflect': 3,\n",
       "                               'refund': 3,\n",
       "                               'regenerate': 1,\n",
       "                               'regulate': 2,\n",
       "                               'reject': 2,\n",
       "                               'relieve': 1,\n",
       "                               'remain': 12,\n",
       "                               'remove': 3,\n",
       "                               'renew': 2,\n",
       "                               'reopen': 3,\n",
       "                               'repay': 1,\n",
       "                               'replace': 5,\n",
       "                               'replicate': 1,\n",
       "                               'report': 9,\n",
       "                               'represent': 2,\n",
       "                               'reprint': 1,\n",
       "                               'reprove': 1,\n",
       "                               'require': 8,\n",
       "                               'resign': 1,\n",
       "                               'resist': 2,\n",
       "                               'resolve': 3,\n",
       "                               'resonate': 1,\n",
       "                               'respond': 2,\n",
       "                               'restore': 3,\n",
       "                               'restructure': 1,\n",
       "                               'resubmit': 1,\n",
       "                               'result': 14,\n",
       "                               'resume': 1,\n",
       "                               'retain': 3,\n",
       "                               'retard': 1,\n",
       "                               'return': 5,\n",
       "                               'review': 4,\n",
       "                               'revive': 3,\n",
       "                               'reward': 2,\n",
       "                               'rewrite': 2,\n",
       "                               'ring': 3,\n",
       "                               'rise': 8,\n",
       "                               'risk': 5,\n",
       "                               'roll': 2,\n",
       "                               'rule': 2,\n",
       "                               'run': 8,\n",
       "                               'sabotage': 1,\n",
       "                               'sacrifice': 1,\n",
       "                               'save': 2,\n",
       "                               'say': 19,\n",
       "                               'scoop': 1,\n",
       "                               'scrape': 1,\n",
       "                               'scream': 1,\n",
       "                               'scuttle': 1,\n",
       "                               'secede': 1,\n",
       "                               'seduce': 1,\n",
       "                               'see': 25,\n",
       "                               'seek': 13,\n",
       "                               'seem': 2,\n",
       "                               'seize': 2,\n",
       "                               'select': 1,\n",
       "                               'sell': 36,\n",
       "                               'send': 5,\n",
       "                               'serve': 4,\n",
       "                               'set': 6,\n",
       "                               'settle': 6,\n",
       "                               'sew': 1,\n",
       "                               'shake': 1,\n",
       "                               'share': 3,\n",
       "                               'ship': 2,\n",
       "                               'shoot': 1,\n",
       "                               'shore': 1,\n",
       "                               'show': 2,\n",
       "                               'shrug': 1,\n",
       "                               'shut': 2,\n",
       "                               'sidestep': 1,\n",
       "                               'sign': 3,\n",
       "                               'signal': 4,\n",
       "                               'single': 1,\n",
       "                               'sink': 2,\n",
       "                               'sit': 1,\n",
       "                               'slash': 1,\n",
       "                               'sleep': 2,\n",
       "                               'slide': 1,\n",
       "                               'slip': 1,\n",
       "                               'slow': 6,\n",
       "                               'sound': 1,\n",
       "                               'spackle': 1,\n",
       "                               'spark': 2,\n",
       "                               'speak': 1,\n",
       "                               'specialize': 1,\n",
       "                               'specify': 3,\n",
       "                               'speculate': 1,\n",
       "                               'speed': 1,\n",
       "                               'spend': 3,\n",
       "                               'split': 1,\n",
       "                               'spread': 2,\n",
       "                               'spur': 2,\n",
       "                               'stake': 1,\n",
       "                               'stand': 2,\n",
       "                               'start': 3,\n",
       "                               'stay': 5,\n",
       "                               'steal': 1,\n",
       "                               'stem': 2,\n",
       "                               'step': 2,\n",
       "                               'stick': 1,\n",
       "                               'stifle': 1,\n",
       "                               'stop': 5,\n",
       "                               'store': 1,\n",
       "                               'strike': 2,\n",
       "                               'string': 1,\n",
       "                               'strip': 1,\n",
       "                               'study': 2,\n",
       "                               'submit': 2,\n",
       "                               'subscribe': 1,\n",
       "                               'subsidize': 1,\n",
       "                               'succeed': 5,\n",
       "                               'sue': 1,\n",
       "                               'suffer': 4,\n",
       "                               'suggest': 1,\n",
       "                               'suit': 1,\n",
       "                               'supply': 1,\n",
       "                               'support': 10,\n",
       "                               'surge': 1,\n",
       "                               'survive': 2,\n",
       "                               'suspect': 1,\n",
       "                               'suspend': 3,\n",
       "                               'swallow': 1,\n",
       "                               'swap': 2,\n",
       "                               'sweeten': 1,\n",
       "                               'swing': 1,\n",
       "                               'switch': 1,\n",
       "                               'tackle': 1,\n",
       "                               'take': 43,\n",
       "                               'talk': 4,\n",
       "                               'taper': 1,\n",
       "                               'target': 2,\n",
       "                               'teach': 2,\n",
       "                               'telephone': 1,\n",
       "                               'tender': 1,\n",
       "                               'test': 1,\n",
       "                               'testify': 1,\n",
       "                               'think': 9,\n",
       "                               'thwart': 1,\n",
       "                               'tilt': 1,\n",
       "                               'time': 1,\n",
       "                               'tinker': 1,\n",
       "                               'tip': 1,\n",
       "                               'tolerate': 2,\n",
       "                               'top': 1,\n",
       "                               'total': 2,\n",
       "                               'tote': 1,\n",
       "                               'touch': 1,\n",
       "                               'trade': 7,\n",
       "                               'trail': 1,\n",
       "                               'train': 2,\n",
       "                               'transfer': 1,\n",
       "                               'trash': 1,\n",
       "                               'travel': 1,\n",
       "                               'treat': 4,\n",
       "                               'trim': 1,\n",
       "                               'trust': 1,\n",
       "                               'try': 3,\n",
       "                               'tuck': 1,\n",
       "                               'turn': 6,\n",
       "                               'underline': 1,\n",
       "                               'underpin': 1,\n",
       "                               'understand': 2,\n",
       "                               'undo': 1,\n",
       "                               'unload': 1,\n",
       "                               'unveil': 2,\n",
       "                               'unwind': 1,\n",
       "                               'uptick': 1,\n",
       "                               'use': 13,\n",
       "                               'usurp': 1,\n",
       "                               'vary': 2,\n",
       "                               'veto': 5,\n",
       "                               'view': 1,\n",
       "                               'violate': 4,\n",
       "                               'vote': 3,\n",
       "                               'wait': 4,\n",
       "                               'waive': 1,\n",
       "                               'want': 13,\n",
       "                               'ward': 2,\n",
       "                               'watch': 4,\n",
       "                               'weaken': 2,\n",
       "                               'wear': 1,\n",
       "                               'weather': 1,\n",
       "                               'weigh': 1,\n",
       "                               'welcome': 2,\n",
       "                               'whipsaw': 1,\n",
       "                               'wield': 1,\n",
       "                               'win': 10,\n",
       "                               'wish': 2,\n",
       "                               'withdraw': 3,\n",
       "                               'withhold': 2,\n",
       "                               'withstand': 2,\n",
       "                               'work': 7,\n",
       "                               'worry': 1,\n",
       "                               'worsen': 1,\n",
       "                               'write': 2,\n",
       "                               'yield': 28,\n",
       "                               'zip': 1}),\n",
       "                     'VBD': FreqDist({'Asked': 1,\n",
       "                               'CHANGED': 1,\n",
       "                               'Died': 1,\n",
       "                               'ENDED': 1,\n",
       "                               'acceded': 1,\n",
       "                               'accelerated': 1,\n",
       "                               'accepted': 2,\n",
       "                               'accused': 3,\n",
       "                               'acquired': 7,\n",
       "                               'acted': 1,\n",
       "                               'adapted': 1,\n",
       "                               'added': 38,\n",
       "                               'admitted': 2,\n",
       "                               'adopted': 2,\n",
       "                               'advanced': 8,\n",
       "                               'advised': 1,\n",
       "                               'advocated': 1,\n",
       "                               'aggravated': 1,\n",
       "                               'agreed': 11,\n",
       "                               'aimed': 1,\n",
       "                               'aired': 1,\n",
       "                               'alleged': 1,\n",
       "                               'allowed': 2,\n",
       "                               'amounted': 3,\n",
       "                               'angered': 1,\n",
       "                               'announced': 14,\n",
       "                               'annoyed': 1,\n",
       "                               'anticipated': 2,\n",
       "                               'appeared': 6,\n",
       "                               'applied': 2,\n",
       "                               'approached': 1,\n",
       "                               'approved': 14,\n",
       "                               'argued': 3,\n",
       "                               'arranged': 1,\n",
       "                               'arrived': 1,\n",
       "                               'asked': 9,\n",
       "                               'assassinated': 1,\n",
       "                               'asserted': 2,\n",
       "                               'assumed': 1,\n",
       "                               'assured': 1,\n",
       "                               'attached': 1,\n",
       "                               'attempted': 1,\n",
       "                               'attended': 1,\n",
       "                               'attributed': 4,\n",
       "                               'authorized': 1,\n",
       "                               'averaged': 1,\n",
       "                               'awarded': 1,\n",
       "                               'backed': 1,\n",
       "                               'balked': 2,\n",
       "                               'banned': 1,\n",
       "                               'barred': 3,\n",
       "                               'beat': 1,\n",
       "                               'became': 17,\n",
       "                               'befell': 1,\n",
       "                               'befuddled': 1,\n",
       "                               'began': 32,\n",
       "                               'begot': 1,\n",
       "                               'believed': 3,\n",
       "                               'benefited': 3,\n",
       "                               'bid': 5,\n",
       "                               'billed': 1,\n",
       "                               'blamed': 1,\n",
       "                               'bled': 1,\n",
       "                               'blurred': 1,\n",
       "                               'booked': 1,\n",
       "                               'boosted': 4,\n",
       "                               'bothered': 1,\n",
       "                               'bought': 8,\n",
       "                               'bounced': 1,\n",
       "                               'bowed': 2,\n",
       "                               'breathed': 1,\n",
       "                               'bribed': 1,\n",
       "                               'brightened': 1,\n",
       "                               'broadened': 1,\n",
       "                               'broke': 1,\n",
       "                               'brought': 3,\n",
       "                               'brushed': 1,\n",
       "                               'built': 4,\n",
       "                               'called': 7,\n",
       "                               'came': 21,\n",
       "                               'cared': 1,\n",
       "                               'carried': 2,\n",
       "                               'caused': 4,\n",
       "                               'cautioned': 2,\n",
       "                               'changed': 6,\n",
       "                               'chastised': 1,\n",
       "                               'chose': 1,\n",
       "                               'circulated': 1,\n",
       "                               'cited': 8,\n",
       "                               'claimed': 2,\n",
       "                               'cleared': 1,\n",
       "                               'clicked': 1,\n",
       "                               'climbed': 4,\n",
       "                               'clipped': 1,\n",
       "                               'closed': 25,\n",
       "                               'co-founded': 1,\n",
       "                               'collaborated': 1,\n",
       "                               'collapsed': 1,\n",
       "                               'committed': 1,\n",
       "                               'compared': 1,\n",
       "                               'complained': 3,\n",
       "                               'completed': 9,\n",
       "                               'concentrated': 2,\n",
       "                               'concluded': 4,\n",
       "                               'condemned': 1,\n",
       "                               'confirmed': 3,\n",
       "                               'consented': 10,\n",
       "                               'contained': 4,\n",
       "                               'continued': 8,\n",
       "                               'contracted': 2,\n",
       "                               'contributed': 6,\n",
       "                               'controlled': 1,\n",
       "                               'copied': 1,\n",
       "                               'covered': 1,\n",
       "                               'cranked': 1,\n",
       "                               'created': 4,\n",
       "                               'criticized': 2,\n",
       "                               'curled': 1,\n",
       "                               'curtailed': 1,\n",
       "                               'cut': 10,\n",
       "                               'damaged': 1,\n",
       "                               'decided': 13,\n",
       "                               'declared': 4,\n",
       "                               'declined': 22,\n",
       "                               'decried': 1,\n",
       "                               'deemed': 1,\n",
       "                               'defeated': 1,\n",
       "                               'defended': 2,\n",
       "                               'denied': 1,\n",
       "                               'depended': 1,\n",
       "                               'described': 4,\n",
       "                               'determined': 1,\n",
       "                               'developed': 4,\n",
       "                               'devised': 1,\n",
       "                               'devoted': 1,\n",
       "                               'did': 62,\n",
       "                               'died': 2,\n",
       "                               'disagreed': 1,\n",
       "                               'disciplined': 1,\n",
       "                               'disclosed': 3,\n",
       "                               'discovered': 1,\n",
       "                               'discussed': 1,\n",
       "                               'dismissed': 2,\n",
       "                               'disposed': 1,\n",
       "                               'distinguished': 1,\n",
       "                               'dominated': 1,\n",
       "                               'doubled': 3,\n",
       "                               'doubted': 2,\n",
       "                               'downgraded': 1,\n",
       "                               'dreamed': 1,\n",
       "                               'dreamt': 1,\n",
       "                               'drew': 1,\n",
       "                               'drifted': 2,\n",
       "                               'drooled': 1,\n",
       "                               'dropped': 12,\n",
       "                               'drove': 2,\n",
       "                               'dubbed': 1,\n",
       "                               'dumped': 2,\n",
       "                               'earned': 10,\n",
       "                               'eased': 3,\n",
       "                               'edged': 2,\n",
       "                               'eliminated': 1,\n",
       "                               'emerged': 1,\n",
       "                               'emphasized': 1,\n",
       "                               'enabled': 1,\n",
       "                               'ended': 21,\n",
       "                               'endorsed': 1,\n",
       "                               'enraged': 1,\n",
       "                               'entered': 2,\n",
       "                               'enticed': 1,\n",
       "                               'entitled': 1,\n",
       "                               'escaped': 1,\n",
       "                               'established': 1,\n",
       "                               'estimated': 8,\n",
       "                               'evaluated': 1,\n",
       "                               'evaporated': 1,\n",
       "                               'evolved': 1,\n",
       "                               'examined': 1,\n",
       "                               'exceeded': 1,\n",
       "                               'expanded': 4,\n",
       "                               'expelled': 1,\n",
       "                               'expired': 1,\n",
       "                               'explained': 3,\n",
       "                               'exploded': 1,\n",
       "                               'expressed': 3,\n",
       "                               'extended': 2,\n",
       "                               'exuded': 1,\n",
       "                               'failed': 10,\n",
       "                               'faltered': 1,\n",
       "                               'fared': 3,\n",
       "                               'favored': 1,\n",
       "                               'feared': 2,\n",
       "                               'featured': 2,\n",
       "                               'fed': 1,\n",
       "                               'fell': 32,\n",
       "                               'felt': 4,\n",
       "                               'fielded': 1,\n",
       "                               'filed': 4,\n",
       "                               'finished': 4,\n",
       "                               'fired': 3,\n",
       "                               'firmed': 1,\n",
       "                               'fled': 1,\n",
       "                               'folded': 1,\n",
       "                               'followed': 6,\n",
       "                               'forced': 2,\n",
       "                               'forecast': 1,\n",
       "                               'formed': 1,\n",
       "                               'fought': 1,\n",
       "                               'found': 13,\n",
       "                               'fretted': 1,\n",
       "                               'fueled': 1,\n",
       "                               'gained': 15,\n",
       "                               'gave': 10,\n",
       "                               'got': 11,\n",
       "                               'graduated': 1,\n",
       "                               'grew': 4,\n",
       "                               'guided': 1,\n",
       "                               'had': 160,\n",
       "                               'halted': 1,\n",
       "                               'hampered': 1,\n",
       "                               'handed': 1,\n",
       "                               'happened': 1,\n",
       "                               'harped': 1,\n",
       "                               'hauled': 1,\n",
       "                               'have': 1,\n",
       "                               'heard': 1,\n",
       "                               'held': 3,\n",
       "                               'helped': 8,\n",
       "                               'hid': 1,\n",
       "                               'hired': 3,\n",
       "                               'hit': 3,\n",
       "                               'hoped': 1,\n",
       "                               'hosted': 1,\n",
       "                               'hung': 1,\n",
       "                               'identified': 3,\n",
       "                               'ignored': 1,\n",
       "                               'implied': 1,\n",
       "                               'imported': 2,\n",
       "                               'imposed': 2,\n",
       "                               'inched': 2,\n",
       "                               'included': 14,\n",
       "                               'increased': 9,\n",
       "                               'indicated': 10,\n",
       "                               'inherited': 1,\n",
       "                               'insisted': 3,\n",
       "                               'inspired': 2,\n",
       "                               'intended': 1,\n",
       "                               'introduced': 7,\n",
       "                               'invented': 1,\n",
       "                               'invested': 1,\n",
       "                               'involved': 3,\n",
       "                               'issued': 3,\n",
       "                               'joined': 4,\n",
       "                               'jumped': 5,\n",
       "                               'kept': 4,\n",
       "                               'kicked': 1,\n",
       "                               'killed': 2,\n",
       "                               'knew': 3,\n",
       "                               'knocked': 1,\n",
       "                               'lacked': 1,\n",
       "                               'lasted': 1,\n",
       "                               'lauded': 1,\n",
       "                               'launched': 5,\n",
       "                               'lay': 1,\n",
       "                               'leapt': 1,\n",
       "                               'learned': 3,\n",
       "                               'led': 7,\n",
       "                               'left': 3,\n",
       "                               'lengthened': 1,\n",
       "                               'lent': 1,\n",
       "                               'let': 1,\n",
       "                               'licensed': 1,\n",
       "                               'lifted': 1,\n",
       "                               'limited': 1,\n",
       "                               'lost': 10,\n",
       "                               'loved': 2,\n",
       "                               'lowered': 2,\n",
       "                               'made': 23,\n",
       "                               'maintained': 3,\n",
       "                               'managed': 1,\n",
       "                               'marketed': 1,\n",
       "                               'matched': 3,\n",
       "                               'materialized': 1,\n",
       "                               'meant': 2,\n",
       "                               'merged': 1,\n",
       "                               'met': 3,\n",
       "                               'mixed': 1,\n",
       "                               'mounted': 1,\n",
       "                               'moved': 3,\n",
       "                               'named': 2,\n",
       "                               'narrowed': 2,\n",
       "                               'needed': 5,\n",
       "                               'negotiated': 1,\n",
       "                               'nominated': 1,\n",
       "                               'notched': 1,\n",
       "                               'noted': 22,\n",
       "                               'numbered': 1,\n",
       "                               'obligated': 1,\n",
       "                               'observed': 1,\n",
       "                               'obtained': 1,\n",
       "                               'occurred': 3,\n",
       "                               'offered': 16,\n",
       "                               'omitted': 1,\n",
       "                               'opened': 5,\n",
       "                               'opposed': 2,\n",
       "                               'ordered': 4,\n",
       "                               'outnumbered': 1,\n",
       "                               'overvalued': 1,\n",
       "                               'owed': 2,\n",
       "                               'paid': 5,\n",
       "                               'participated': 1,\n",
       "                               'passed': 4,\n",
       "                               'patented': 1,\n",
       "                               'picked': 1,\n",
       "                               'placed': 2,\n",
       "                               'planned': 5,\n",
       "                               'pleaded': 2,\n",
       "                               'pledged': 1,\n",
       "                               'plugged': 1,\n",
       "                               'plummeted': 1,\n",
       "                               'plunged': 5,\n",
       "                               'pointed': 2,\n",
       "                               'polled': 1,\n",
       "                               'possessed': 1,\n",
       "                               'posted': 11,\n",
       "                               'poured': 1,\n",
       "                               'praised': 2,\n",
       "                               'predicted': 3,\n",
       "                               'preferred': 1,\n",
       "                               'presented': 1,\n",
       "                               'printed': 1,\n",
       "                               'produced': 2,\n",
       "                               'profited': 1,\n",
       "                               'prompted': 3,\n",
       "                               'proposed': 10,\n",
       "                               'proved': 1,\n",
       "                               'provided': 1,\n",
       "                               'published': 1,\n",
       "                               'pulled': 1,\n",
       "                               'purchased': 2,\n",
       "                               'pushed': 1,\n",
       "                               'put': 3,\n",
       "                               'questioned': 1,\n",
       "                               'quipped': 1,\n",
       "                               'quoted': 1,\n",
       "                               'raced': 1,\n",
       "                               'raised': 9,\n",
       "                               'ran': 6,\n",
       "                               'rang': 1,\n",
       "                               'ranged': 2,\n",
       "                               'ranked': 1,\n",
       "                               'rated': 1,\n",
       "                               'reached': 4,\n",
       "                               'reacted': 1,\n",
       "                               'read': 2,\n",
       "                               'reaffirmed': 1,\n",
       "                               'realized': 4,\n",
       "                               'rebuffed': 1,\n",
       "                               'rebuked': 1,\n",
       "                               'received': 12,\n",
       "                               'recommended': 1,\n",
       "                               'recorded': 1,\n",
       "                               'recovered': 2,\n",
       "                               'reduced': 4,\n",
       "                               'referred': 4,\n",
       "                               'reflected': 3,\n",
       "                               'refused': 3,\n",
       "                               'registered': 1,\n",
       "                               'rejected': 7,\n",
       "                               'released': 2,\n",
       "                               'remained': 5,\n",
       "                               'remarked': 1,\n",
       "                               'reminded': 1,\n",
       "                               'removed': 1,\n",
       "                               'renewed': 1,\n",
       "                               'reopened': 1,\n",
       "                               'replaced': 1,\n",
       "                               'reported': 25,\n",
       "                               'represented': 2,\n",
       "                               'required': 1,\n",
       "                               'reserved': 1,\n",
       "                               'resigned': 5,\n",
       "                               'resolved': 1,\n",
       "                               'responded': 3,\n",
       "                               'restored': 1,\n",
       "                               'restructured': 1,\n",
       "                               'resulted': 1,\n",
       "                               'retired': 1,\n",
       "                               'retraced': 1,\n",
       "                               'returned': 2,\n",
       "                               'reversed': 1,\n",
       "                               'reviewed': 1,\n",
       "                               'rolled': 1,\n",
       "                               'rose': 61,\n",
       "                               'ruled': 4,\n",
       "                               'rushed': 2,\n",
       "                               'sacked': 1,\n",
       "                               'sagged': 1,\n",
       "                               'said': 614,\n",
       "                               'sank': 1,\n",
       "                               'saved': 1,\n",
       "                               'saw': 5,\n",
       "                               'scheduled': 1,\n",
       "                               'scrambled': 1,\n",
       "                               'screened': 1,\n",
       "                               'screwed': 1,\n",
       "                               'searched': 1,\n",
       "                               'secured': 1,\n",
       "                               'seemed': 7,\n",
       "                               'seized': 1,\n",
       "                               'sent': 2,\n",
       "                               'served': 1,\n",
       "                               'set': 6,\n",
       "                               'settled': 3,\n",
       "                               'shed': 1,\n",
       "                               'shopped': 1,\n",
       "                               'shot': 1,\n",
       "                               'showed': 13,\n",
       "                               'shrank': 2,\n",
       "                               'signed': 2,\n",
       "                               'skidded': 1,\n",
       "                               'skipped': 1,\n",
       "                               'slid': 2,\n",
       "                               'slipped': 4,\n",
       "                               'snapped': 2,\n",
       "                               'sneaked': 1,\n",
       "                               'soared': 4,\n",
       "                               'sold': 14,\n",
       "                               'solved': 1,\n",
       "                               'sought': 4,\n",
       "                               'sounded': 2,\n",
       "                               'sparked': 3,\n",
       "                               'speculated': 3,\n",
       "                               'spent': 4,\n",
       "                               'spoke': 1,\n",
       "                               'spotted': 1,\n",
       "                               'spurned': 1,\n",
       "                               'sputtered': 1,\n",
       "                               'squeezed': 1,\n",
       "                               'started': 4,\n",
       "                               'stated': 1,\n",
       "                               'stayed': 1,\n",
       "                               'stemmed': 1,\n",
       "                               'stepped': 2,\n",
       "                               'stirred': 1,\n",
       "                               'stood': 5,\n",
       "                               'stopped': 4,\n",
       "                               'stored': 2,\n",
       "                               'strengthened': 1,\n",
       "                               'stressed': 1,\n",
       "                               'stretched': 1,\n",
       "                               'struggled': 1,\n",
       "                               'stuck': 1,\n",
       "                               'studied': 1,\n",
       "                               'succeeded': 2,\n",
       "                               'sued': 2,\n",
       "                               'suffered': 2,\n",
       "                               'suggested': 6,\n",
       "                               'summoned': 1,\n",
       "                               'supported': 1,\n",
       "                               'surfaced': 1,\n",
       "                               'surged': 6,\n",
       "                               'surrendered': 3,\n",
       "                               'suspended': 2,\n",
       "                               'sweetened': 1,\n",
       "                               'switched': 1,\n",
       "                               'taught': 3,\n",
       "                               'tempted': 1,\n",
       "                               'termed': 1,\n",
       "                               'terminated': 1,\n",
       "                               'thought': 5,\n",
       "                               'threatened': 1,\n",
       "                               'tied': 1,\n",
       "                               'told': 12,\n",
       "                               'took': 28,\n",
       "                               'totaled': 10,\n",
       "                               'touched': 1,\n",
       "                               'traced': 1,\n",
       "                               'trailed': 3,\n",
       "                               'transformed': 1,\n",
       "                               'traveled': 1,\n",
       "                               'treated': 1,\n",
       "                               'tried': 3,\n",
       "                               'triggered': 1,\n",
       "                               'tripled': 1,\n",
       "                               'tumbled': 3,\n",
       "                               'turned': 7,\n",
       "                               'understood': 1,\n",
       "                               'underwent': 2,\n",
       "                               'unleashed': 1,\n",
       "                               'unveiled': 3,\n",
       "                               'upheld': 2,\n",
       "                               'urged': 5,\n",
       "                               'used': 4,\n",
       "                               'ushered': 1,\n",
       "                               'varied': 1,\n",
       "                               'ventilated': 1,\n",
       "                               'viewed': 1,\n",
       "                               'violated': 2,\n",
       "                               'visited': 1,\n",
       "                               'voted': 3,\n",
       "                               'vowed': 1,\n",
       "                               'waited': 1,\n",
       "                               'waived': 1,\n",
       "                               'wanted': 12,\n",
       "                               'warned': 2,\n",
       "                               'was': 367,\n",
       "                               'weighed': 2,\n",
       "                               'welcomed': 1,\n",
       "                               'went': 14,\n",
       "                               'were': 197,\n",
       "                               'withdrew': 1,\n",
       "                               'won': 9,\n",
       "                               'worked': 5,\n",
       "                               'wound': 1,\n",
       "                               'wrote': 9,\n",
       "                               'yielded': 1}),\n",
       "                     'VBG': FreqDist({'According': 8,\n",
       "                               'Adopting': 1,\n",
       "                               'Advancing': 1,\n",
       "                               'Arbitraging': 1,\n",
       "                               'Assuming': 2,\n",
       "                               'Beginning': 1,\n",
       "                               'Being': 1,\n",
       "                               'Bucking': 1,\n",
       "                               'Buying': 3,\n",
       "                               'Citing': 1,\n",
       "                               'Continuing': 1,\n",
       "                               'DIALING': 1,\n",
       "                               'Declining': 1,\n",
       "                               'Defending': 1,\n",
       "                               'Depending': 1,\n",
       "                               'Determining': 1,\n",
       "                               'Encouraging': 1,\n",
       "                               'Excluding': 2,\n",
       "                               'Filling': 1,\n",
       "                               'Following': 1,\n",
       "                               'Getting': 1,\n",
       "                               'Having': 1,\n",
       "                               'Judging': 1,\n",
       "                               'Knowing': 1,\n",
       "                               'Legislating': 1,\n",
       "                               'Moving': 1,\n",
       "                               'Observing': 1,\n",
       "                               'Offering': 1,\n",
       "                               'PORTING': 1,\n",
       "                               'Performing': 1,\n",
       "                               'Reducing': 1,\n",
       "                               'SWITCHING': 1,\n",
       "                               'Standing': 1,\n",
       "                               'Starting': 1,\n",
       "                               'TRIMMING': 1,\n",
       "                               'Taking': 2,\n",
       "                               'Winning': 1,\n",
       "                               'abating': 1,\n",
       "                               'abolishing': 1,\n",
       "                               'abounding': 1,\n",
       "                               'abridging': 1,\n",
       "                               'accepting': 3,\n",
       "                               'according': 34,\n",
       "                               'accounting': 1,\n",
       "                               'accusing': 1,\n",
       "                               'achieving': 1,\n",
       "                               'acknowledging': 1,\n",
       "                               'acquiring': 2,\n",
       "                               'adapting': 1,\n",
       "                               'adding': 3,\n",
       "                               'addressing': 1,\n",
       "                               'adjusting': 2,\n",
       "                               'admitting': 6,\n",
       "                               'advancing': 2,\n",
       "                               'advertising': 3,\n",
       "                               'advocating': 1,\n",
       "                               'affecting': 1,\n",
       "                               'agreeing': 1,\n",
       "                               'ailing': 2,\n",
       "                               'aiming': 1,\n",
       "                               'alleging': 2,\n",
       "                               'altering': 1,\n",
       "                               'amending': 1,\n",
       "                               'anticipating': 1,\n",
       "                               'apologizing': 1,\n",
       "                               'appealing': 2,\n",
       "                               'appearing': 1,\n",
       "                               'arguing': 2,\n",
       "                               'arising': 1,\n",
       "                               'asking': 7,\n",
       "                               'asserting': 1,\n",
       "                               'assuming': 5,\n",
       "                               'attacking': 1,\n",
       "                               'attempting': 5,\n",
       "                               'attending': 1,\n",
       "                               'attracting': 1,\n",
       "                               'authorizing': 1,\n",
       "                               'avoiding': 1,\n",
       "                               'awarding': 1,\n",
       "                               'backing': 1,\n",
       "                               'banking': 2,\n",
       "                               'banning': 2,\n",
       "                               'barking': 1,\n",
       "                               'bearing': 2,\n",
       "                               'becoming': 6,\n",
       "                               'beginning': 7,\n",
       "                               'behaving': 1,\n",
       "                               'being': 33,\n",
       "                               'belonging': 2,\n",
       "                               'betting': 1,\n",
       "                               'boarding': 1,\n",
       "                               'bombarding': 1,\n",
       "                               'booming': 3,\n",
       "                               'boosting': 1,\n",
       "                               'borrowing': 1,\n",
       "                               'breaking': 1,\n",
       "                               'bribing': 1,\n",
       "                               'bringing': 1,\n",
       "                               'broadcasting': 1,\n",
       "                               'brokering': 1,\n",
       "                               'budding': 1,\n",
       "                               'building': 5,\n",
       "                               'bundling': 1,\n",
       "                               'buying': 12,\n",
       "                               'calling': 1,\n",
       "                               'carrying': 1,\n",
       "                               'cascading': 1,\n",
       "                               'casting': 2,\n",
       "                               'causing': 5,\n",
       "                               'challenging': 1,\n",
       "                               'championing': 1,\n",
       "                               'changing': 3,\n",
       "                               'characterizing': 1,\n",
       "                               'charging': 1,\n",
       "                               'checking': 1,\n",
       "                               'choosing': 2,\n",
       "                               'citing': 4,\n",
       "                               'claiming': 2,\n",
       "                               'clearing': 1,\n",
       "                               'climbing': 2,\n",
       "                               'closing': 3,\n",
       "                               'collecting': 1,\n",
       "                               'coming': 16,\n",
       "                               'commenting': 1,\n",
       "                               'committing': 1,\n",
       "                               'competing': 2,\n",
       "                               'complaining': 1,\n",
       "                               'completing': 1,\n",
       "                               'conceding': 1,\n",
       "                               'concentrating': 1,\n",
       "                               'condemning': 1,\n",
       "                               'conducting': 2,\n",
       "                               'considering': 4,\n",
       "                               'consisting': 1,\n",
       "                               'containing': 1,\n",
       "                               'contesting': 1,\n",
       "                               'continuing': 13,\n",
       "                               'contributing': 2,\n",
       "                               'controlling': 3,\n",
       "                               'converting': 1,\n",
       "                               'cooperating': 1,\n",
       "                               'copying': 1,\n",
       "                               'correcting': 1,\n",
       "                               'counting': 1,\n",
       "                               'covering': 2,\n",
       "                               'crashing': 1,\n",
       "                               'creating': 5,\n",
       "                               'crossing': 2,\n",
       "                               'cruising': 1,\n",
       "                               'crying': 1,\n",
       "                               'curbing': 1,\n",
       "                               'cutting': 5,\n",
       "                               'dating': 1,\n",
       "                               'dealing': 1,\n",
       "                               'declaring': 3,\n",
       "                               'declining': 4,\n",
       "                               'deducting': 1,\n",
       "                               'defying': 1,\n",
       "                               'deliberating': 1,\n",
       "                               'delivering': 1,\n",
       "                               'demanding': 2,\n",
       "                               'demonstrating': 1,\n",
       "                               'denouncing': 2,\n",
       "                               'denying': 6,\n",
       "                               'depending': 1,\n",
       "                               'descending': 1,\n",
       "                               'designing': 1,\n",
       "                               'deteriorating': 1,\n",
       "                               'deterring': 1,\n",
       "                               'devastating': 1,\n",
       "                               'developing': 5,\n",
       "                               'devouring': 1,\n",
       "                               'directing': 1,\n",
       "                               'disclosing': 1,\n",
       "                               'discontinuing': 1,\n",
       "                               'discouraging': 1,\n",
       "                               'discussing': 3,\n",
       "                               'disseminating': 1,\n",
       "                               'diversifying': 1,\n",
       "                               'dividing': 1,\n",
       "                               'doing': 9,\n",
       "                               'doling': 1,\n",
       "                               'dominating': 1,\n",
       "                               'drawing': 1,\n",
       "                               'drinking': 1,\n",
       "                               'driving': 3,\n",
       "                               'dwindling': 1,\n",
       "                               'earning': 1,\n",
       "                               'easing': 2,\n",
       "                               'eating': 1,\n",
       "                               'eliminating': 2,\n",
       "                               'emerging': 1,\n",
       "                               'enabling': 2,\n",
       "                               'encircling': 1,\n",
       "                               'encouraging': 2,\n",
       "                               'encroaching': 1,\n",
       "                               'ending': 8,\n",
       "                               'engaging': 1,\n",
       "                               'engineering': 1,\n",
       "                               'enjoying': 1,\n",
       "                               'entering': 2,\n",
       "                               'equaling': 1,\n",
       "                               'establishing': 1,\n",
       "                               'evaluating': 1,\n",
       "                               'evoking': 1,\n",
       "                               'exceeding': 2,\n",
       "                               'exchanging': 1,\n",
       "                               'executing': 3,\n",
       "                               'exerting': 1,\n",
       "                               'existing': 4,\n",
       "                               'expanding': 5,\n",
       "                               'expecting': 3,\n",
       "                               'experiencing': 1,\n",
       "                               'explaining': 1,\n",
       "                               'expressing': 1,\n",
       "                               'extending': 2,\n",
       "                               'eyeing': 1,\n",
       "                               'facing': 5,\n",
       "                               'factoring': 1,\n",
       "                               'failing': 4,\n",
       "                               'fainting': 1,\n",
       "                               'falling': 5,\n",
       "                               'fawning': 1,\n",
       "                               'featuring': 2,\n",
       "                               'feeling': 3,\n",
       "                               'fetching': 1,\n",
       "                               'fighting': 2,\n",
       "                               'filling': 1,\n",
       "                               'financing': 5,\n",
       "                               'finding': 2,\n",
       "                               'focusing': 2,\n",
       "                               'following': 13,\n",
       "                               'forcing': 1,\n",
       "                               'forecasting': 1,\n",
       "                               'foundering': 1,\n",
       "                               'frustrating': 1,\n",
       "                               'fuming': 1,\n",
       "                               'functioning': 1,\n",
       "                               'funding': 2,\n",
       "                               'fundraising': 1,\n",
       "                               'gaining': 4,\n",
       "                               'gauging': 1,\n",
       "                               'getting': 9,\n",
       "                               'giving': 9,\n",
       "                               'going': 20,\n",
       "                               'granting': 1,\n",
       "                               'growing': 22,\n",
       "                               'guarding': 1,\n",
       "                               'hailing': 1,\n",
       "                               'happening': 1,\n",
       "                               'hauling': 1,\n",
       "                               'having': 11,\n",
       "                               'heading': 1,\n",
       "                               'heating': 1,\n",
       "                               'helping': 6,\n",
       "                               'hitting': 2,\n",
       "                               'holding': 17,\n",
       "                               'hugging': 1,\n",
       "                               'hurting': 2,\n",
       "                               'ignoring': 3,\n",
       "                               'impeding': 1,\n",
       "                               'impending': 1,\n",
       "                               'imposing': 1,\n",
       "                               'improving': 3,\n",
       "                               'inching': 1,\n",
       "                               'including': 38,\n",
       "                               'increasing': 18,\n",
       "                               'indicating': 2,\n",
       "                               'indulging': 1,\n",
       "                               'influencing': 1,\n",
       "                               'initialing': 1,\n",
       "                               'initiating': 1,\n",
       "                               'injecting': 1,\n",
       "                               'injuring': 1,\n",
       "                               'inquiring': 1,\n",
       "                               'insinuating': 1,\n",
       "                               'installing': 1,\n",
       "                               'introducing': 2,\n",
       "                               'investigating': 3,\n",
       "                               'investing': 2,\n",
       "                               'inviting': 1,\n",
       "                               'involving': 9,\n",
       "                               'issuing': 1,\n",
       "                               'jeopardizing': 1,\n",
       "                               'joining': 3,\n",
       "                               'jumping': 1,\n",
       "                               'justifying': 1,\n",
       "                               'keeping': 5,\n",
       "                               'killing': 2,\n",
       "                               'labeling': 1,\n",
       "                               'lagging': 1,\n",
       "                               'laughing': 2,\n",
       "                               'laying': 1,\n",
       "                               'leading': 12,\n",
       "                               'leaving': 5,\n",
       "                               'lending': 2,\n",
       "                               'lessening': 1,\n",
       "                               'letting': 2,\n",
       "                               'leveling': 2,\n",
       "                               'leveraging': 1,\n",
       "                               'limiting': 2,\n",
       "                               'limping': 1,\n",
       "                               'living': 1,\n",
       "                               'loading': 1,\n",
       "                               'looking': 9,\n",
       "                               'looming': 3,\n",
       "                               'losing': 8,\n",
       "                               'lowering': 2,\n",
       "                               'lying': 5,\n",
       "                               'mailing': 1,\n",
       "                               'maintaining': 4,\n",
       "                               'making': 20,\n",
       "                               'managing': 7,\n",
       "                               'manufacturing': 8,\n",
       "                               'marching': 2,\n",
       "                               'marketing': 3,\n",
       "                               'mating': 1,\n",
       "                               'maturing': 1,\n",
       "                               'meaning': 2,\n",
       "                               'mobilizing': 1,\n",
       "                               'moving': 3,\n",
       "                               'mulling': 1,\n",
       "                               'multiplying': 1,\n",
       "                               'muscling': 1,\n",
       "                               'naming': 2,\n",
       "                               'needing': 1,\n",
       "                               'negotiating': 1,\n",
       "                               'neighboring': 1,\n",
       "                               'nonrecurring': 1,\n",
       "                               'noticing': 1,\n",
       "                               'noting': 2,\n",
       "                               'obtaining': 1,\n",
       "                               'occupying': 1,\n",
       "                               'offending': 1,\n",
       "                               'offering': 10,\n",
       "                               'offsetting': 3,\n",
       "                               'opening': 4,\n",
       "                               'operating': 11,\n",
       "                               'ordering': 1,\n",
       "                               'outlawing': 1,\n",
       "                               'overpaying': 1,\n",
       "                               'overriding': 1,\n",
       "                               'owning': 1,\n",
       "                               'packaging': 1,\n",
       "                               'passing': 2,\n",
       "                               'paying': 14,\n",
       "                               'pealing': 1,\n",
       "                               'pending': 5,\n",
       "                               'performing': 2,\n",
       "                               'permitting': 1,\n",
       "                               'phasing': 2,\n",
       "                               'photocopying': 1,\n",
       "                               'picking': 1,\n",
       "                               'pitting': 1,\n",
       "                               'placing': 2,\n",
       "                               'planning': 2,\n",
       "                               'playing': 5,\n",
       "                               'plunging': 2,\n",
       "                               'pointing': 2,\n",
       "                               'posing': 1,\n",
       "                               'posting': 2,\n",
       "                               'practicing': 1,\n",
       "                               'predicting': 4,\n",
       "                               'preserving': 2,\n",
       "                               'pressing': 1,\n",
       "                               'prevailing': 2,\n",
       "                               'preventing': 4,\n",
       "                               'producing': 4,\n",
       "                               'prohibiting': 1,\n",
       "                               'promoting': 2,\n",
       "                               'propelling': 1,\n",
       "                               'proposing': 4,\n",
       "                               'prosecuting': 1,\n",
       "                               'protecting': 4,\n",
       "                               'providing': 5,\n",
       "                               'proving': 3,\n",
       "                               'publishing': 4,\n",
       "                               'pulling': 1,\n",
       "                               'pumping': 2,\n",
       "                               'punishing': 1,\n",
       "                               'purchasing': 9,\n",
       "                               'pushing': 2,\n",
       "                               'putting': 2,\n",
       "                               'quashing': 1,\n",
       "                               'queuing': 1,\n",
       "                               'quitting': 1,\n",
       "                               'quoting': 1,\n",
       "                               'racing': 1,\n",
       "                               'raising': 7,\n",
       "                               'rallying': 1,\n",
       "                               'ranging': 1,\n",
       "                               'ratcheting': 1,\n",
       "                               'rating': 1,\n",
       "                               'reaching': 2,\n",
       "                               'reading': 1,\n",
       "                               'reaping': 1,\n",
       "                               'rebounding': 1,\n",
       "                               'rebuilding': 1,\n",
       "                               'recalling': 1,\n",
       "                               'receiving': 4,\n",
       "                               'reciting': 1,\n",
       "                               'recognizing': 1,\n",
       "                               'recommending': 1,\n",
       "                               'recovering': 1,\n",
       "                               'recruiting': 1,\n",
       "                               'redeeming': 1,\n",
       "                               'redistributing': 1,\n",
       "                               'reducing': 4,\n",
       "                               'reeling': 1,\n",
       "                               'referring': 1,\n",
       "                               'refitting': 1,\n",
       "                               'reflecting': 4,\n",
       "                               'refreshing': 1,\n",
       "                               'refunding': 1,\n",
       "                               'regarding': 5,\n",
       "                               'regulating': 2,\n",
       "                               'reinstating': 1,\n",
       "                               'relating': 1,\n",
       "                               'remaining': 9,\n",
       "                               'removing': 1,\n",
       "                               'renewing': 1,\n",
       "                               'replacing': 1,\n",
       "                               'replicating': 1,\n",
       "                               'reporting': 5,\n",
       "                               'representing': 4,\n",
       "                               'requesting': 1,\n",
       "                               'requiring': 2,\n",
       "                               'researching': 1,\n",
       "                               'reshaping': 2,\n",
       "                               'resigning': 1,\n",
       "                               'resisting': 1,\n",
       "                               'responding': 2,\n",
       "                               'restricting': 1,\n",
       "                               'restructuring': 2,\n",
       "                               'resulting': 6,\n",
       "                               'retaining': 2,\n",
       "                               'retaliating': 1,\n",
       "                               'retiring': 1,\n",
       "                               'returning': 2,\n",
       "                               'reviewing': 1,\n",
       "                               'revising': 1,\n",
       "                               'rewarding': 1,\n",
       "                               'riding': 1,\n",
       "                               'ringing': 2,\n",
       "                               'rising': 11,\n",
       "                               'rolling': 1,\n",
       "                               'running': 6,\n",
       "                               'sacrificing': 1,\n",
       "                               'safeguarding': 1,\n",
       "                               'sagging': 1,\n",
       "                               'satisfying': 1,\n",
       "                               'saving': 1,\n",
       "                               'saying': 18,\n",
       "                               'scaring': 1,\n",
       "                               'scrambling': 2,\n",
       "                               'scrutinizing': 3,\n",
       "                               'searching': 1,\n",
       "                               'seeing': 3,\n",
       "                               'seeking': 19,\n",
       "                               'segmenting': 1,\n",
       "                               'selling': 8,\n",
       "                               'sending': 2,\n",
       "                               'sentencing': 1,\n",
       "                               'servicing': 1,\n",
       "                               'serving': 3,\n",
       "                               'setting': 1,\n",
       "                               'shaping': 1,\n",
       "                               'shedding': 1,\n",
       "                               'shipping': 2,\n",
       "                               'shopping': 1,\n",
       "                               'shoring': 1,\n",
       "                               'showing': 4,\n",
       "                               'shrinking': 1,\n",
       "                               'signaling': 1,\n",
       "                               'signifying': 1,\n",
       "                               'signing': 2,\n",
       "                               'sitting': 1,\n",
       "                               'sketching': 1,\n",
       "                               'slashing': 1,\n",
       "                               'sleeping': 1,\n",
       "                               'sliding': 1,\n",
       "                               'slowing': 8,\n",
       "                               'smothering': 1,\n",
       "                               'snaking': 1,\n",
       "                               'soaring': 1,\n",
       "                               'softening': 1,\n",
       "                               'soliciting': 1,\n",
       "                               'sorting': 1,\n",
       "                               'sounding': 1,\n",
       "                               'sparing': 1,\n",
       "                               'sparking': 1,\n",
       "                               'speaking': 1,\n",
       "                               'specializing': 1,\n",
       "                               'speculating': 1,\n",
       "                               'spending': 2,\n",
       "                               'spurring': 1,\n",
       "                               'stacking': 1,\n",
       "                               'starting': 5,\n",
       "                               'staying': 1,\n",
       "                               'stemming': 3,\n",
       "                               'stepping': 3,\n",
       "                               'sticking': 1,\n",
       "                               'stimulating': 2,\n",
       "                               'stressing': 2,\n",
       "                               'stretching': 1,\n",
       "                               'striving': 1,\n",
       "                               'struggling': 3,\n",
       "                               'studying': 2,\n",
       "                               'subjecting': 1,\n",
       "                               'succeeding': 2,\n",
       "                               'suing': 2,\n",
       "                               'surrounding': 2,\n",
       "                               'surviving': 3,\n",
       "                               'swapping': 1,\n",
       "                               'sweeping': 2,\n",
       "                               'swelling': 1,\n",
       "                               'tailoring': 1,\n",
       "                               'taking': 10,\n",
       "                               'talking': 4,\n",
       "                               'tapping': 1,\n",
       "                               'targeting': 3,\n",
       "                               'teetering': 1,\n",
       "                               'telling': 3,\n",
       "                               'tendering': 1,\n",
       "                               'thinking': 5,\n",
       "                               'thumbing': 1,\n",
       "                               'tightening': 1,\n",
       "                               'totaling': 2,\n",
       "                               'tracking': 1,\n",
       "                               'trading': 18,\n",
       "                               'transacting': 2,\n",
       "                               'transferring': 2,\n",
       "                               'transforming': 1,\n",
       "                               'transporting': 1,\n",
       "                               'traveling': 2,\n",
       "                               'treating': 3,\n",
       "                               'trimming': 1,\n",
       "                               'trying': 22,\n",
       "                               'turning': 6,\n",
       "                               'twisting': 1,\n",
       "                               'undercutting': 1,\n",
       "                               'undergoing': 1,\n",
       "                               'underlying': 8,\n",
       "                               'underperforming': 1,\n",
       "                               'undertaking': 1,\n",
       "                               'upsetting': 1,\n",
       "                               'urging': 1,\n",
       "                               'ushering': 1,\n",
       "                               'using': 16,\n",
       "                               'uttering': 1,\n",
       "                               'varying': 3,\n",
       "                               'viewing': 1,\n",
       "                               'violating': 1,\n",
       "                               'visiting': 2,\n",
       "                               'waiting': 2,\n",
       "                               'waiving': 1,\n",
       "                               'walking': 1,\n",
       "                               'wallowing': 1,\n",
       "                               'wanting': 1,\n",
       "                               'warning': 3,\n",
       "                               'watching': 1,\n",
       "                               'weighing': 1,\n",
       "                               'winding': 1,\n",
       "                               'winning': 2,\n",
       "                               'wooing': 1,\n",
       "                               'working': 9,\n",
       "                               'worrying': 1,\n",
       "                               'wrecking': 1,\n",
       "                               'wrestling': 1,\n",
       "                               'writing': 3,\n",
       "                               'yielding': 3}),\n",
       "                     'VBN': FreqDist({'Absorbed': 1,\n",
       "                               'Annualized': 1,\n",
       "                               'Asked': 1,\n",
       "                               'Concerned': 1,\n",
       "                               'Confronted': 1,\n",
       "                               'Continued': 1,\n",
       "                               'Developed': 1,\n",
       "                               'Estimated': 2,\n",
       "                               'Filmed': 1,\n",
       "                               'Founded': 2,\n",
       "                               'Funded': 1,\n",
       "                               'Given': 1,\n",
       "                               'Guaranteed': 2,\n",
       "                               'Left': 1,\n",
       "                               'Named': 1,\n",
       "                               'OFFERED': 1,\n",
       "                               'Posted': 2,\n",
       "                               'Provided': 1,\n",
       "                               'Put': 1,\n",
       "                               'Rated': 1,\n",
       "                               'Reached': 1,\n",
       "                               'Regarded': 1,\n",
       "                               'Rekindled': 1,\n",
       "                               'Related': 1,\n",
       "                               'Stung': 2,\n",
       "                               'UPHELD': 1,\n",
       "                               'Used': 1,\n",
       "                               'abandoned': 3,\n",
       "                               'absorbed': 2,\n",
       "                               'accelerated': 1,\n",
       "                               'accepted': 3,\n",
       "                               'accounted': 1,\n",
       "                               'accrued': 1,\n",
       "                               'accumulated': 1,\n",
       "                               'accused': 3,\n",
       "                               'achieved': 1,\n",
       "                               'acquired': 11,\n",
       "                               'added': 2,\n",
       "                               'adjusted': 5,\n",
       "                               'adopted': 3,\n",
       "                               'advanced': 1,\n",
       "                               'advertised': 2,\n",
       "                               'advised': 1,\n",
       "                               'afflicted': 1,\n",
       "                               'agreed': 5,\n",
       "                               'aimed': 9,\n",
       "                               'alarmed': 1,\n",
       "                               'alienated': 1,\n",
       "                               'alleged': 8,\n",
       "                               'allocated': 2,\n",
       "                               'allowed': 7,\n",
       "                               'altered': 1,\n",
       "                               'amended': 1,\n",
       "                               'announced': 3,\n",
       "                               'answered': 2,\n",
       "                               'anticipated': 3,\n",
       "                               'applied': 2,\n",
       "                               'appointed': 1,\n",
       "                               'appropriated': 1,\n",
       "                               'approved': 11,\n",
       "                               'argued': 1,\n",
       "                               'armed': 1,\n",
       "                               'arrested': 1,\n",
       "                               'asked': 1,\n",
       "                               'assembled': 2,\n",
       "                               'assessed': 1,\n",
       "                               'assigned': 1,\n",
       "                               'assisted': 1,\n",
       "                               'associated': 4,\n",
       "                               'assumed': 1,\n",
       "                               'assured': 1,\n",
       "                               'attached': 2,\n",
       "                               'attempted': 1,\n",
       "                               'attracted': 2,\n",
       "                               'attributed': 2,\n",
       "                               'auctioned': 3,\n",
       "                               'automated': 1,\n",
       "                               'averted': 1,\n",
       "                               'awarded': 4,\n",
       "                               'backed': 2,\n",
       "                               'banned': 2,\n",
       "                               'barred': 8,\n",
       "                               'based': 31,\n",
       "                               'battered': 1,\n",
       "                               'beaten': 2,\n",
       "                               'become': 7,\n",
       "                               'been': 150,\n",
       "                               'begun': 2,\n",
       "                               'beleaguered': 1,\n",
       "                               'believed': 4,\n",
       "                               'blamed': 3,\n",
       "                               'blocked': 1,\n",
       "                               'bolstered': 2,\n",
       "                               'boosted': 5,\n",
       "                               'born': 1,\n",
       "                               'borrowed': 1,\n",
       "                               'bought': 2,\n",
       "                               'bribed': 1,\n",
       "                               'broken': 4,\n",
       "                               'brought': 3,\n",
       "                               'built': 11,\n",
       "                               'buoyed': 1,\n",
       "                               'burned': 1,\n",
       "                               'calculated': 1,\n",
       "                               'called': 13,\n",
       "                               'capitalized': 2,\n",
       "                               'capped': 1,\n",
       "                               'carried': 3,\n",
       "                               'cast': 3,\n",
       "                               'caught': 4,\n",
       "                               'caused': 9,\n",
       "                               'centralized': 1,\n",
       "                               'chaired': 2,\n",
       "                               'changed': 7,\n",
       "                               'characterized': 1,\n",
       "                               'charged': 3,\n",
       "                               'chastised': 1,\n",
       "                               'chilled': 1,\n",
       "                               'chopped': 1,\n",
       "                               'chosen': 4,\n",
       "                               'cited': 2,\n",
       "                               'clamped': 1,\n",
       "                               'clarified': 1,\n",
       "                               'clashed': 1,\n",
       "                               'classed': 1,\n",
       "                               'classified': 1,\n",
       "                               'cleaned': 1,\n",
       "                               'climbed': 1,\n",
       "                               'clobbered': 1,\n",
       "                               'closed': 5,\n",
       "                               'cluttered': 1,\n",
       "                               'coated': 1,\n",
       "                               'codified': 1,\n",
       "                               'collapsed': 1,\n",
       "                               'collected': 3,\n",
       "                               'colored': 1,\n",
       "                               'combined': 6,\n",
       "                               'come': 7,\n",
       "                               'commanded': 1,\n",
       "                               'committed': 2,\n",
       "                               'compared': 32,\n",
       "                               'competed': 1,\n",
       "                               'compiled': 2,\n",
       "                               'complained': 1,\n",
       "                               'completed': 6,\n",
       "                               'complicated': 1,\n",
       "                               'composed': 1,\n",
       "                               'compressed': 1,\n",
       "                               'concerned': 2,\n",
       "                               'concluded': 1,\n",
       "                               'condemned': 1,\n",
       "                               'conducted': 1,\n",
       "                               'confined': 2,\n",
       "                               'confirmed': 2,\n",
       "                               'confused': 1,\n",
       "                               'connected': 2,\n",
       "                               'consented': 1,\n",
       "                               'considered': 9,\n",
       "                               'construed': 1,\n",
       "                               'contacted': 3,\n",
       "                               'contained': 2,\n",
       "                               'continued': 6,\n",
       "                               'contributed': 1,\n",
       "                               'controlled': 1,\n",
       "                               'converted': 1,\n",
       "                               'convicted': 3,\n",
       "                               'convinced': 1,\n",
       "                               'cooled': 2,\n",
       "                               'corrected': 1,\n",
       "                               'coupled': 3,\n",
       "                               'covered': 5,\n",
       "                               'created': 4,\n",
       "                               'crippled': 2,\n",
       "                               'crossed': 1,\n",
       "                               'crowded': 1,\n",
       "                               'cultivated': 1,\n",
       "                               'curbed': 1,\n",
       "                               'cushioned': 1,\n",
       "                               'customized': 1,\n",
       "                               'cut': 3,\n",
       "                               'damaged': 2,\n",
       "                               'dashed': 1,\n",
       "                               'decided': 3,\n",
       "                               'declared': 1,\n",
       "                               'decorated': 1,\n",
       "                               'deemed': 1,\n",
       "                               'defined': 1,\n",
       "                               'delayed': 1,\n",
       "                               'delisted': 1,\n",
       "                               'delivered': 5,\n",
       "                               'denied': 3,\n",
       "                               'depleted': 1,\n",
       "                               'depressed': 1,\n",
       "                               'deprived': 1,\n",
       "                               'derived': 1,\n",
       "                               'described': 4,\n",
       "                               'designated': 1,\n",
       "                               'designed': 20,\n",
       "                               'desired': 2,\n",
       "                               'despised': 1,\n",
       "                               'detailed': 1,\n",
       "                               'deteriorated': 1,\n",
       "                               'determined': 3,\n",
       "                               'developed': 3,\n",
       "                               'diagnosed': 1,\n",
       "                               'died': 1,\n",
       "                               'diluted': 2,\n",
       "                               'diminished': 2,\n",
       "                               'directed': 1,\n",
       "                               'disappointed': 3,\n",
       "                               'disapproved': 1,\n",
       "                               'discarded': 1,\n",
       "                               'disclosed': 13,\n",
       "                               'discontinued': 2,\n",
       "                               'discovered': 5,\n",
       "                               'discussed': 3,\n",
       "                               'dismissed': 2,\n",
       "                               'disputed': 1,\n",
       "                               'distributed': 1,\n",
       "                               'diversified': 1,\n",
       "                               'divided': 4,\n",
       "                               'documented': 1,\n",
       "                               'dominated': 2,\n",
       "                               'done': 5,\n",
       "                               'drafted': 1,\n",
       "                               'drawn': 3,\n",
       "                               'dressed': 1,\n",
       "                               'dropped': 1,\n",
       "                               'dumped': 2,\n",
       "                               'earned': 1,\n",
       "                               'echoed': 1,\n",
       "                               'edged': 1,\n",
       "                               'educated': 1,\n",
       "                               'elected': 6,\n",
       "                               'eliminated': 6,\n",
       "                               'embroiled': 1,\n",
       "                               'employed': 3,\n",
       "                               'empowered': 1,\n",
       "                               'enacted': 2,\n",
       "                               'enclosed': 1,\n",
       "                               'ended': 3,\n",
       "                               'endorsed': 1,\n",
       "                               'engaged': 2,\n",
       "                               'engineered': 1,\n",
       "                               'enhanced': 1,\n",
       "                               'enjoyed': 1,\n",
       "                               'ensnarled': 1,\n",
       "                               'entered': 2,\n",
       "                               'entrenched': 1,\n",
       "                               'entrusted': 2,\n",
       "                               'equipped': 1,\n",
       "                               'escalated': 1,\n",
       "                               'estimated': 12,\n",
       "                               'exacerbated': 1,\n",
       "                               'examined': 1,\n",
       "                               'excited': 1,\n",
       "                               'executed': 3,\n",
       "                               'exercised': 3,\n",
       "                               'exhausted': 1,\n",
       "                               'exhibited': 1,\n",
       "                               'existed': 1,\n",
       "                               'expanded': 1,\n",
       "                               'expected': 52,\n",
       "                               'expedited': 1,\n",
       "                               'expelled': 2,\n",
       "                               'experienced': 1,\n",
       "                               'exposed': 2,\n",
       "                               'expressed': 2,\n",
       "                               'expunged': 1,\n",
       "                               'extended': 1,\n",
       "                               'faced': 2,\n",
       "                               'faded': 1,\n",
       "                               'failed': 6,\n",
       "                               'fallen': 6,\n",
       "                               'fashioned': 1,\n",
       "                               'fattened': 1,\n",
       "                               'favored': 1,\n",
       "                               'feared': 1,\n",
       "                               'fed': 1,\n",
       "                               'felt': 1,\n",
       "                               'filed': 13,\n",
       "                               'filled': 1,\n",
       "                               'finalized': 1,\n",
       "                               'financed': 4,\n",
       "                               'fined': 18,\n",
       "                               'finished': 1,\n",
       "                               'fired': 3,\n",
       "                               'fixed': 9,\n",
       "                               'fizzled': 1,\n",
       "                               'flirted': 1,\n",
       "                               'floated': 1,\n",
       "                               'flooded': 1,\n",
       "                               'focused': 5,\n",
       "                               'followed': 6,\n",
       "                               'forced': 4,\n",
       "                               'forecast': 1,\n",
       "                               'forgiven': 2,\n",
       "                               'forgotten': 1,\n",
       "                               'formed': 5,\n",
       "                               'found': 10,\n",
       "                               'founded': 2,\n",
       "                               'frightened': 1,\n",
       "                               'frozen': 2,\n",
       "                               'fueled': 3,\n",
       "                               'funded': 3,\n",
       "                               'gained': 3,\n",
       "                               'generated': 1,\n",
       "                               'given': 11,\n",
       "                               'gone': 3,\n",
       "                               'gored': 1,\n",
       "                               'got': 7,\n",
       "                               'gotten': 4,\n",
       "                               'granted': 1,\n",
       "                               'grown': 4,\n",
       "                               'guaranteed': 1,\n",
       "                               'had': 5,\n",
       "                               'hailed': 1,\n",
       "                               'halted': 1,\n",
       "                               'hampered': 1,\n",
       "                               'handled': 2,\n",
       "                               'harmed': 1,\n",
       "                               'harvested': 1,\n",
       "                               'headed': 1,\n",
       "                               'headlined': 1,\n",
       "                               'heard': 3,\n",
       "                               'heated': 1,\n",
       "                               'heightened': 1,\n",
       "                               'held': 18,\n",
       "                               'helped': 6,\n",
       "                               'hidden': 1,\n",
       "                               'hired': 1,\n",
       "                               'hit': 3,\n",
       "                               'hunted': 1,\n",
       "                               'hurt': 6,\n",
       "                               'identified': 2,\n",
       "                               'impaired': 1,\n",
       "                               'implemented': 1,\n",
       "                               'imported': 2,\n",
       "                               'imposed': 1,\n",
       "                               'impressed': 1,\n",
       "                               'improved': 7,\n",
       "                               'included': 3,\n",
       "                               'incorporated': 1,\n",
       "                               'increased': 14,\n",
       "                               'incurred': 3,\n",
       "                               'indicated': 4,\n",
       "                               'industrialized': 2,\n",
       "                               'inflated': 1,\n",
       "                               'influenced': 1,\n",
       "                               'infringed': 1,\n",
       "                               'initiated': 1,\n",
       "                               'inserted': 1,\n",
       "                               'installed': 2,\n",
       "                               'instituted': 2,\n",
       "                               'instructed': 1,\n",
       "                               'insured': 1,\n",
       "                               'integrated': 3,\n",
       "                               'intended': 3,\n",
       "                               'interested': 1,\n",
       "                               'interrogated': 1,\n",
       "                               'interviewed': 2,\n",
       "                               'introduced': 3,\n",
       "                               'invented': 1,\n",
       "                               'invested': 6,\n",
       "                               'involved': 9,\n",
       "                               'issued': 9,\n",
       "                               'judged': 1,\n",
       "                               'jumped': 3,\n",
       "                               'justified': 1,\n",
       "                               'kept': 3,\n",
       "                               'kicked': 1,\n",
       "                               'killed': 1,\n",
       "                               'knitted': 1,\n",
       "                               'known': 12,\n",
       "                               'labeled': 2,\n",
       "                               'laid': 1,\n",
       "                               'launched': 8,\n",
       "                               'learned': 1,\n",
       "                               'led': 9,\n",
       "                               'left': 6,\n",
       "                               'lent': 1,\n",
       "                               'licensed': 1,\n",
       "                               'lifted': 1,\n",
       "                               'limited': 5,\n",
       "                               'linked': 2,\n",
       "                               'liquidated': 2,\n",
       "                               'listed': 9,\n",
       "                               'loaded': 2,\n",
       "                               'located': 4,\n",
       "                               'locked': 2,\n",
       "                               'looked': 1,\n",
       "                               'lost': 5,\n",
       "                               'lowered': 2,\n",
       "                               'made': 33,\n",
       "                               'magnified': 1,\n",
       "                               'mailed': 1,\n",
       "                               'maintained': 2,\n",
       "                               'managed': 5,\n",
       "                               'manufactured': 2,\n",
       "                               'marketed': 3,\n",
       "                               'matched': 2,\n",
       "                               'meant': 1,\n",
       "                               'measured': 2,\n",
       "                               'mentioned': 1,\n",
       "                               'merged': 1,\n",
       "                               'met': 3,\n",
       "                               'midsized': 1,\n",
       "                               'milked': 1,\n",
       "                               'minted': 1,\n",
       "                               'mired': 2,\n",
       "                               'missed': 1,\n",
       "                               'mixed': 7,\n",
       "                               'moderated': 2,\n",
       "                               'mollified': 1,\n",
       "                               'mortgaged': 1,\n",
       "                               'mounted': 1,\n",
       "                               'moved': 2,\n",
       "                               'muffled': 1,\n",
       "                               'murdered': 2,\n",
       "                               'muted': 1,\n",
       "                               'named': 20,\n",
       "                               'needed': 9,\n",
       "                               'negotiated': 1,\n",
       "                               'nominated': 1,\n",
       "                               'noted': 3,\n",
       "                               'noticed': 1,\n",
       "                               'notified': 1,\n",
       "                               'nullified': 1,\n",
       "                               'nurtured': 1,\n",
       "                               'obligated': 1,\n",
       "                               'observed': 1,\n",
       "                               'obsessed': 1,\n",
       "                               'obtained': 2,\n",
       "                               'offered': 10,\n",
       "                               'offset': 6,\n",
       "                               'omitted': 1,\n",
       "                               'opened': 4,\n",
       "                               'operated': 2,\n",
       "                               'opposed': 6,\n",
       "                               'orchestrated': 1,\n",
       "                               'ordered': 9,\n",
       "                               'organized': 2,\n",
       "                               'oriented': 2,\n",
       "                               'outdistanced': 1,\n",
       "                               'outlawed': 1,\n",
       "                               'outpaced': 1,\n",
       "                               'overcome': 1,\n",
       "                               'overdone': 1,\n",
       "                               'overpriced': 1,\n",
       "                               'overstated': 1,\n",
       "                               'overused': 1,\n",
       "                               'owed': 3,\n",
       "                               'own': 1,\n",
       "                               'owned': 6,\n",
       "                               'paid': 15,\n",
       "                               'painted': 1,\n",
       "                               'parched': 1,\n",
       "                               'passed': 3,\n",
       "                               'pegged': 2,\n",
       "                               'perceived': 2,\n",
       "                               'performed': 3,\n",
       "                               'permitted': 3,\n",
       "                               'placed': 6,\n",
       "                               'plagued': 1,\n",
       "                               'planned': 8,\n",
       "                               'planted': 1,\n",
       "                               'played': 3,\n",
       "                               'pleased': 4,\n",
       "                               'plunged': 1,\n",
       "                               'pointed': 1,\n",
       "                               'polarized': 1,\n",
       "                               'polled': 1,\n",
       "                               'populated': 1,\n",
       "                               'portrayed': 1,\n",
       "                               'positioned': 2,\n",
       "                               'posted': 3,\n",
       "                               'postponed': 1,\n",
       "                               'practiced': 1,\n",
       "                               'preapproved': 1,\n",
       "                               'predicated': 1,\n",
       "                               'preferred': 9,\n",
       "                               'prepared': 9,\n",
       "                               'presented': 2,\n",
       "                               'pressed': 2,\n",
       "                               'priced': 26,\n",
       "                               'printed': 2,\n",
       "                               'produced': 8,\n",
       "                               'prohibited': 1,\n",
       "                               'prolonged': 2,\n",
       "                               'promised': 1,\n",
       "                               'prompted': 2,\n",
       "                               'proposed': 12,\n",
       "                               'prosecuted': 1,\n",
       "                               'protected': 1,\n",
       "                               'proved': 1,\n",
       "                               'proven': 1,\n",
       "                               'provided': 7,\n",
       "                               'provoked': 1,\n",
       "                               'publicized': 2,\n",
       "                               'purchased': 2,\n",
       "                               'pursued': 3,\n",
       "                               'pushed': 2,\n",
       "                               'put': 8,\n",
       "                               'puzzled': 1,\n",
       "                               'qualified': 4,\n",
       "                               'quoted': 6,\n",
       "                               'raised': 6,\n",
       "                               'ranged': 3,\n",
       "                               'rarefied': 1,\n",
       "                               'rated': 1,\n",
       "                               'ratified': 1,\n",
       "                               'rationed': 1,\n",
       "                               'reached': 13,\n",
       "                               'read': 1,\n",
       "                               'reallocated': 1,\n",
       "                               'reaped': 1,\n",
       "                               'received': 10,\n",
       "                               'reclaimed': 1,\n",
       "                               'recorded': 1,\n",
       "                               'recouped': 1,\n",
       "                               'recruited': 1,\n",
       "                               'rectified': 1,\n",
       "                               'recycled': 1,\n",
       "                               'redeemed': 3,\n",
       "                               'reduced': 5,\n",
       "                               'referred': 2,\n",
       "                               'reflected': 1,\n",
       "                               'refunded': 1,\n",
       "                               'refused': 4,\n",
       "                               'regarded': 3,\n",
       "                               'registered': 5,\n",
       "                               'regulated': 3,\n",
       "                               'reimbursed': 1,\n",
       "                               'rejected': 4,\n",
       "                               'related': 7,\n",
       "                               'relaunched': 1,\n",
       "                               'released': 2,\n",
       "                               'relegated': 2,\n",
       "                               'relied': 1,\n",
       "                               'remarked': 1,\n",
       "                               'removed': 2,\n",
       "                               'renewed': 3,\n",
       "                               'renovated': 1,\n",
       "                               'reorganized': 1,\n",
       "                               'repaid': 2,\n",
       "                               'repaired': 1,\n",
       "                               'replaced': 5,\n",
       "                               'replicated': 1,\n",
       "                               'reported': 12,\n",
       "                               'represented': 1,\n",
       "                               'repriced': 1,\n",
       "                               'requested': 3,\n",
       "                               'required': 9,\n",
       "                               'rescheduled': 1,\n",
       "                               'respected': 3,\n",
       "                               'responded': 1,\n",
       "                               'restructured': 2,\n",
       "                               'resulted': 1,\n",
       "                               'retained': 2,\n",
       "                               'retired': 4,\n",
       "                               'returned': 3,\n",
       "                               'revised': 1,\n",
       "                               'revived': 3,\n",
       "                               'rigged': 1,\n",
       "                               'risen': 2,\n",
       "                               'robbed': 1,\n",
       "                               'rolled': 1,\n",
       "                               'romanticized': 2,\n",
       "                               'rooted': 1,\n",
       "                               'rumored': 3,\n",
       "                               'run': 6,\n",
       "                               'rung': 2,\n",
       "                               'rusted': 1,\n",
       "                               'said': 14,\n",
       "                               'scared': 1,\n",
       "                               'scattered': 1,\n",
       "                               'scheduled': 13,\n",
       "                               'scrambled': 1,\n",
       "                               'scrapped': 1,\n",
       "                               'secured': 2,\n",
       "                               'seen': 8,\n",
       "                               'selected': 2,\n",
       "                               'sent': 4,\n",
       "                               'served': 1,\n",
       "                               'serviced': 1,\n",
       "                               'set': 12,\n",
       "                               'settled': 2,\n",
       "                               'shaken': 1,\n",
       "                               'shared': 1,\n",
       "                               'shipped': 6,\n",
       "                               'shown': 1,\n",
       "                               'shut': 1,\n",
       "                               'signed': 3,\n",
       "                               'singled': 1,\n",
       "                               'skyrocketed': 2,\n",
       "                               'slated': 1,\n",
       "                               'slowed': 1,\n",
       "                               'snapped': 1,\n",
       "                               'soared': 3,\n",
       "                               'sold': 25,\n",
       "                               'solved': 1,\n",
       "                               'sought': 6,\n",
       "                               'sparked': 1,\n",
       "                               'specialized': 2,\n",
       "                               'specified': 3,\n",
       "                               'speculated': 1,\n",
       "                               'spent': 4,\n",
       "                               'split': 2,\n",
       "                               'spooked': 1,\n",
       "                               'spread': 2,\n",
       "                               'spun': 1,\n",
       "                               'spurred': 3,\n",
       "                               'squeezed': 1,\n",
       "                               'stabbed': 1,\n",
       "                               'stacked': 1,\n",
       "                               'staid': 1,\n",
       "                               'started': 2,\n",
       "                               'stated': 1,\n",
       "                               'stepped': 1,\n",
       "                               'stimulated': 1,\n",
       "                               'stoked': 1,\n",
       "                               'stopped': 3,\n",
       "                               'strapped': 1,\n",
       "                               'stressed': 1,\n",
       "                               'stripped': 1,\n",
       "                               'structured': 1,\n",
       "                               'studied': 4,\n",
       "                               'subdued': 2,\n",
       "                               'subordinated': 3,\n",
       "                               'subpoenaed': 1,\n",
       "                               'superimposed': 1,\n",
       "                               'supported': 2,\n",
       "                               'surfaced': 1,\n",
       "                               'surged': 2,\n",
       "                               'surprised': 2,\n",
       "                               'surveyed': 1,\n",
       "                               'suspended': 7,\n",
       "                               'sustained': 2,\n",
       "                               'swapped': 1,\n",
       "                               'sweetened': 1,\n",
       "                               'switched': 1,\n",
       "                               'synchronized': 1,\n",
       "                               'tailored': 1,\n",
       "                               'taken': 16,\n",
       "                               'talked': 1,\n",
       "                               'tanked': 1,\n",
       "                               'targeted': 2,\n",
       "                               'tendered': 3,\n",
       "                               'terminated': 1,\n",
       "                               'tested': 3,\n",
       "                               'thought': 2,\n",
       "                               'threatened': 6,\n",
       "                               'tied': 3,\n",
       "                               'tightened': 1,\n",
       "                               'told': 2,\n",
       "                               'topped': 1,\n",
       "                               'torn': 1,\n",
       "                               'touted': 1,\n",
       "                               'tracked': 1,\n",
       "                               'traded': 15,\n",
       "                               'trained': 2,\n",
       "                               'transformed': 1,\n",
       "                               'treated': 1,\n",
       "                               'tried': 2,\n",
       "                               'triggered': 3,\n",
       "                               'trimmed': 1,\n",
       "                               'tripled': 1,\n",
       "                               'troubled': 1,\n",
       "                               'turned': 4,\n",
       "                               'twinned': 1,\n",
       "                               'understood': 1,\n",
       "                               'unsettled': 1,\n",
       "                               'upheld': 1,\n",
       "                               'upset': 2,\n",
       "                               'used': 26,\n",
       "                               'valued': 8,\n",
       "                               'vested': 1,\n",
       "                               'viewed': 3,\n",
       "                               'voted': 2,\n",
       "                               'vowed': 1,\n",
       "                               'wanted': 1,\n",
       "                               'warned': 2,\n",
       "                               'wasted': 1,\n",
       "                               'watched': 1,\n",
       "                               'wedded': 1,\n",
       "                               'welcomed': 1,\n",
       "                               'withdrawn': 5,\n",
       "                               'won': 1,\n",
       "                               'worked': 2,\n",
       "                               'worried': 6,\n",
       "                               'written': 5,\n",
       "                               'zoomed': 1}),\n",
       "                     'VBP': FreqDist({\"'m\": 13,\n",
       "                               \"'re\": 29,\n",
       "                               \"'ve\": 16,\n",
       "                               'Am': 1,\n",
       "                               'Do': 3,\n",
       "                               'Lure': 1,\n",
       "                               'accept': 1,\n",
       "                               'account': 3,\n",
       "                               'add': 1,\n",
       "                               'advise': 1,\n",
       "                               'advocate': 1,\n",
       "                               'affect': 1,\n",
       "                               'agree': 2,\n",
       "                               'ai': 1,\n",
       "                               'air': 1,\n",
       "                               'allow': 3,\n",
       "                               'am': 1,\n",
       "                               'amass': 1,\n",
       "                               'appeal': 1,\n",
       "                               'appear': 3,\n",
       "                               'applaud': 1,\n",
       "                               'approach': 2,\n",
       "                               'approve': 4,\n",
       "                               'are': 367,\n",
       "                               'argue': 5,\n",
       "                               'arise': 1,\n",
       "                               'ascribe': 1,\n",
       "                               'ask': 1,\n",
       "                               'assist': 1,\n",
       "                               'assume': 2,\n",
       "                               'attract': 2,\n",
       "                               'avoid': 1,\n",
       "                               'bankroll': 1,\n",
       "                               'battle': 1,\n",
       "                               'beat': 1,\n",
       "                               'become': 1,\n",
       "                               'begin': 1,\n",
       "                               'believe': 11,\n",
       "                               'belong': 2,\n",
       "                               'blip': 1,\n",
       "                               'build': 1,\n",
       "                               'burn': 1,\n",
       "                               'buy': 2,\n",
       "                               'calculate': 1,\n",
       "                               'call': 2,\n",
       "                               'carry': 2,\n",
       "                               'cater': 1,\n",
       "                               'cause': 2,\n",
       "                               'change': 1,\n",
       "                               'channel': 1,\n",
       "                               'charge': 2,\n",
       "                               'cite': 1,\n",
       "                               'claim': 4,\n",
       "                               'come': 5,\n",
       "                               'commit': 1,\n",
       "                               'compare': 1,\n",
       "                               'complain': 1,\n",
       "                               'concede': 1,\n",
       "                               'conclude': 1,\n",
       "                               'conduct': 1,\n",
       "                               'conflict': 1,\n",
       "                               'consider': 3,\n",
       "                               'consist': 2,\n",
       "                               'constitute': 1,\n",
       "                               'contain': 3,\n",
       "                               'continue': 7,\n",
       "                               'contrast': 1,\n",
       "                               'convey': 1,\n",
       "                               'copy': 1,\n",
       "                               'create': 1,\n",
       "                               'cry': 1,\n",
       "                               'deal': 1,\n",
       "                               'decide': 1,\n",
       "                               'decline': 3,\n",
       "                               'deem': 1,\n",
       "                               'delay': 1,\n",
       "                               'deliver': 1,\n",
       "                               'denounce': 1,\n",
       "                               'describe': 1,\n",
       "                               'deserve': 2,\n",
       "                               'determine': 1,\n",
       "                               'devise': 1,\n",
       "                               'differ': 1,\n",
       "                               'disagree': 2,\n",
       "                               'disapprove': 1,\n",
       "                               'dislike': 1,\n",
       "                               'dismiss': 1,\n",
       "                               'do': 51,\n",
       "                               'draw': 1,\n",
       "                               'drift': 1,\n",
       "                               'drink': 2,\n",
       "                               'drive': 2,\n",
       "                               'ease': 1,\n",
       "                               'eat': 1,\n",
       "                               'eliminate': 1,\n",
       "                               'encourage': 2,\n",
       "                               'engage': 1,\n",
       "                               'enjoy': 1,\n",
       "                               'espouse': 1,\n",
       "                               'evoke': 1,\n",
       "                               'examine': 1,\n",
       "                               'exceed': 1,\n",
       "                               'exhaust': 1,\n",
       "                               'exist': 1,\n",
       "                               'expect': 6,\n",
       "                               'expire': 3,\n",
       "                               'extend': 1,\n",
       "                               'face': 3,\n",
       "                               'fail': 3,\n",
       "                               'fall': 3,\n",
       "                               'fare': 2,\n",
       "                               'fault': 1,\n",
       "                               'fear': 1,\n",
       "                               'feed': 2,\n",
       "                               'feel': 8,\n",
       "                               'figure': 1,\n",
       "                               'find': 5,\n",
       "                               'flush': 1,\n",
       "                               'fly': 1,\n",
       "                               'follow': 1,\n",
       "                               'force': 1,\n",
       "                               'forecast': 1,\n",
       "                               'get': 7,\n",
       "                               'give': 6,\n",
       "                               'gloss': 1,\n",
       "                               'go': 4,\n",
       "                               'hamstrung': 1,\n",
       "                               'hang': 1,\n",
       "                               'has': 1,\n",
       "                               'have': 221,\n",
       "                               'help': 2,\n",
       "                               'hire': 1,\n",
       "                               'hit': 1,\n",
       "                               'hold': 3,\n",
       "                               'hope': 3,\n",
       "                               'hurt': 1,\n",
       "                               'imply': 1,\n",
       "                               'import': 1,\n",
       "                               'improve': 1,\n",
       "                               'include': 11,\n",
       "                               'indicate': 1,\n",
       "                               'insist': 5,\n",
       "                               'intend': 1,\n",
       "                               'invest': 2,\n",
       "                               'jet': 1,\n",
       "                               'jostle': 1,\n",
       "                               'keep': 1,\n",
       "                               'kill': 1,\n",
       "                               'know': 6,\n",
       "                               'lack': 2,\n",
       "                               'lead': 5,\n",
       "                               'leave': 1,\n",
       "                               'lengthen': 1,\n",
       "                               'let': 1,\n",
       "                               'like': 4,\n",
       "                               'line': 1,\n",
       "                               'live': 2,\n",
       "                               'lock': 1,\n",
       "                               'look': 5,\n",
       "                               'loom': 1,\n",
       "                               'make': 10,\n",
       "                               'manage': 1,\n",
       "                               'mark': 1,\n",
       "                               'materialize': 1,\n",
       "                               'mature': 4,\n",
       "                               'mean': 1,\n",
       "                               'meet': 3,\n",
       "                               'memorize': 1,\n",
       "                               'mention': 1,\n",
       "                               'mirror': 1,\n",
       "                               'need': 13,\n",
       "                               'note': 2,\n",
       "                               'occur': 1,\n",
       "                               'offer': 4,\n",
       "                               'offset': 1,\n",
       "                               'operate': 2,\n",
       "                               'oppose': 5,\n",
       "                               'own': 2,\n",
       "                               'paint': 1,\n",
       "                               'pay': 5,\n",
       "                               'permit': 1,\n",
       "                               'perpetuate': 1,\n",
       "                               'pine': 1,\n",
       "                               'place': 1,\n",
       "                               'plan': 2,\n",
       "                               'plans': 1,\n",
       "                               'play': 1,\n",
       "                               'point': 2,\n",
       "                               'portray': 1,\n",
       "                               'possess': 1,\n",
       "                               'predict': 1,\n",
       "                               'prefer': 1,\n",
       "                               'prevent': 1,\n",
       "                               'print': 1,\n",
       "                               'profess': 1,\n",
       "                               'profit': 1,\n",
       "                               'promise': 1,\n",
       "                               'promote': 1,\n",
       "                               'propose': 1,\n",
       "                               'prove': 1,\n",
       "                               'provide': 2,\n",
       "                               'pull': 1,\n",
       "                               'pursue': 1,\n",
       "                               'push': 1,\n",
       "                               'question': 1,\n",
       "                               'raise': 3,\n",
       "                               'range': 1,\n",
       "                               'reach': 1,\n",
       "                               'read': 2,\n",
       "                               'realize': 1,\n",
       "                               'recede': 1,\n",
       "                               'receive': 2,\n",
       "                               'recognize': 1,\n",
       "                               'refer': 1,\n",
       "                               'reflect': 2,\n",
       "                               'refuse': 2,\n",
       "                               'regard': 2,\n",
       "                               'represent': 5,\n",
       "                               'require': 2,\n",
       "                               'resent': 1,\n",
       "                               'respond': 1,\n",
       "                               'return': 1,\n",
       "                               'ring': 1,\n",
       "                               'ripen': 1,\n",
       "                               'rise': 4,\n",
       "                               'run': 2,\n",
       "                               'say': 56,\n",
       "                               'scrounge': 1,\n",
       "                               'see': 4,\n",
       "                               'seek': 4,\n",
       "                               'seem': 8,\n",
       "                               'sell': 5,\n",
       "                               'send': 1,\n",
       "                               'sense': 1,\n",
       "                               'set': 2,\n",
       "                               'settle': 1,\n",
       "                               'show': 4,\n",
       "                               'sidestep': 1,\n",
       "                               'skip': 1,\n",
       "                               'sound': 1,\n",
       "                               'spend': 1,\n",
       "                               'spook': 1,\n",
       "                               'stand': 5,\n",
       "                               'stare': 1,\n",
       "                               'start': 2,\n",
       "                               'state': 1,\n",
       "                               'stem': 1,\n",
       "                               'stop': 1,\n",
       "                               'stretch': 1,\n",
       "                               'study': 1,\n",
       "                               'subscribe': 1,\n",
       "                               'succeed': 1,\n",
       "                               'suffer': 2,\n",
       "                               'suggest': 4,\n",
       "                               'suspect': 2,\n",
       "                               'swim': 1,\n",
       "                               'swing': 1,\n",
       "                               'take': 5,\n",
       "                               'talk': 1,\n",
       "                               'teach': 1,\n",
       "                               'telegraph': 1,\n",
       "                               'tell': 1,\n",
       "                               'tend': 3,\n",
       "                               'test': 1,\n",
       "                               'test-drive': 1,\n",
       "                               'think': 14,\n",
       "                               'total': 2,\n",
       "                               'touch': 1,\n",
       "                               'trade': 5,\n",
       "                               'transcribe': 1,\n",
       "                               'trespass': 1,\n",
       "                               'try': 1,\n",
       "                               'tune': 2,\n",
       "                               'undercut': 1,\n",
       "                               'underscore': 1,\n",
       "                               'understand': 1,\n",
       "                               'urge': 1,\n",
       "                               'use': 8,\n",
       "                               'view': 1,\n",
       "                               'violate': 3,\n",
       "                               'voice': 1,\n",
       "                               'walk': 4,\n",
       "                               'want': 16,\n",
       "                               'warn': 1,\n",
       "                               'watch': 3,\n",
       "                               'weaken': 1,\n",
       "                               'weigh': 1,\n",
       "                               'whistle': 1,\n",
       "                               'win': 1,\n",
       "                               'work': 1,\n",
       "                               'worry': 3}),\n",
       "                     'VBZ': FreqDist({\"'S\": 1,\n",
       "                               \"'s\": 103,\n",
       "                               'AGREES': 1,\n",
       "                               'APPEARS': 1,\n",
       "                               'Adds': 2,\n",
       "                               'CLEARS': 1,\n",
       "                               'Closes': 1,\n",
       "                               'Competes': 1,\n",
       "                               'Earns': 1,\n",
       "                               'Fails': 1,\n",
       "                               'Is': 1,\n",
       "                               'Says': 7,\n",
       "                               'Takes': 1,\n",
       "                               'Touches': 1,\n",
       "                               'accounts': 1,\n",
       "                               'aces': 1,\n",
       "                               'acknowledges': 1,\n",
       "                               'acquires': 1,\n",
       "                               'acts': 2,\n",
       "                               'adds': 10,\n",
       "                               'admits': 4,\n",
       "                               'agrees': 2,\n",
       "                               'aims': 1,\n",
       "                               'alerts': 1,\n",
       "                               'amounts': 1,\n",
       "                               'answers': 1,\n",
       "                               'anticipates': 2,\n",
       "                               'appears': 8,\n",
       "                               'approves': 1,\n",
       "                               'argues': 1,\n",
       "                               'asks': 5,\n",
       "                               'aspires': 1,\n",
       "                               'asserts': 1,\n",
       "                               'attempts': 2,\n",
       "                               'attracts': 1,\n",
       "                               'attributes': 1,\n",
       "                               'authorizes': 1,\n",
       "                               'awaits': 1,\n",
       "                               'awards': 1,\n",
       "                               'bans': 1,\n",
       "                               'becomes': 7,\n",
       "                               'begins': 4,\n",
       "                               'believes': 12,\n",
       "                               'belongs': 2,\n",
       "                               'benefits': 2,\n",
       "                               'blames': 1,\n",
       "                               'blinks': 1,\n",
       "                               'blocks': 1,\n",
       "                               'boosts': 3,\n",
       "                               'breaks': 3,\n",
       "                               'brings': 2,\n",
       "                               'broadcasts': 1,\n",
       "                               'builds': 1,\n",
       "                               'buys': 1,\n",
       "                               'calls': 5,\n",
       "                               'carries': 4,\n",
       "                               'casts': 2,\n",
       "                               'causes': 1,\n",
       "                               'centers': 1,\n",
       "                               'changes': 1,\n",
       "                               'charges': 2,\n",
       "                               'chooses': 2,\n",
       "                               'cites': 3,\n",
       "                               'claims': 4,\n",
       "                               'combines': 1,\n",
       "                               'comes': 7,\n",
       "                               'comments': 1,\n",
       "                               'compares': 3,\n",
       "                               'competes': 2,\n",
       "                               'complains': 2,\n",
       "                               'concedes': 1,\n",
       "                               'confirms': 1,\n",
       "                               'conforms': 1,\n",
       "                               'considers': 3,\n",
       "                               'consists': 1,\n",
       "                               'contains': 1,\n",
       "                               'contends': 3,\n",
       "                               'continues': 13,\n",
       "                               'contrasts': 1,\n",
       "                               'controls': 1,\n",
       "                               'costs': 4,\n",
       "                               'counts': 2,\n",
       "                               'covers': 3,\n",
       "                               'creates': 2,\n",
       "                               'decides': 1,\n",
       "                               'declines': 2,\n",
       "                               'decries': 1,\n",
       "                               'defeats': 1,\n",
       "                               'defends': 1,\n",
       "                               'defines': 1,\n",
       "                               'demonstrates': 1,\n",
       "                               'denies': 3,\n",
       "                               'depends': 1,\n",
       "                               'describes': 3,\n",
       "                               'develops': 1,\n",
       "                               'digs': 1,\n",
       "                               'disagrees': 1,\n",
       "                               'disappears': 1,\n",
       "                               'dissolves': 1,\n",
       "                               'distributes': 1,\n",
       "                               'disturbs': 1,\n",
       "                               'does': 54,\n",
       "                               'dominates': 1,\n",
       "                               'doubts': 1,\n",
       "                               'draws': 1,\n",
       "                               'earns': 3,\n",
       "                               'eases': 1,\n",
       "                               'eliminates': 3,\n",
       "                               'emerges': 1,\n",
       "                               'employs': 3,\n",
       "                               'empowers': 1,\n",
       "                               'enables': 2,\n",
       "                               'encourages': 1,\n",
       "                               'ends': 1,\n",
       "                               'enhances': 1,\n",
       "                               'enters': 4,\n",
       "                               'entitles': 2,\n",
       "                               'equals': 1,\n",
       "                               'erodes': 1,\n",
       "                               'estimates': 2,\n",
       "                               'exceeds': 1,\n",
       "                               'executes': 1,\n",
       "                               'exhibits': 1,\n",
       "                               'exists': 1,\n",
       "                               'expands': 1,\n",
       "                               'expects': 19,\n",
       "                               'expires': 1,\n",
       "                               'explains': 4,\n",
       "                               'faces': 2,\n",
       "                               'factors': 1,\n",
       "                               'fails': 2,\n",
       "                               'falls': 2,\n",
       "                               'favors': 1,\n",
       "                               'feeds': 1,\n",
       "                               'feels': 2,\n",
       "                               'fills': 2,\n",
       "                               'finds': 1,\n",
       "                               'flies': 1,\n",
       "                               'flows': 2,\n",
       "                               'follows': 5,\n",
       "                               'forces': 2,\n",
       "                               'fumes': 1,\n",
       "                               'gains': 1,\n",
       "                               'gauges': 1,\n",
       "                               'gets': 4,\n",
       "                               'gives': 13,\n",
       "                               'goes': 14,\n",
       "                               'grows': 4,\n",
       "                               'handles': 1,\n",
       "                               'hangs': 1,\n",
       "                               'happens': 1,\n",
       "                               'harms': 1,\n",
       "                               'has': 338,\n",
       "                               'heads': 4,\n",
       "                               'helps': 1,\n",
       "                               'holds': 4,\n",
       "                               'hopes': 8,\n",
       "                               'illustrates': 1,\n",
       "                               'implements': 1,\n",
       "                               'implies': 2,\n",
       "                               'imposes': 1,\n",
       "                               'improves': 1,\n",
       "                               'includes': 12,\n",
       "                               'increases': 3,\n",
       "                               'indicates': 7,\n",
       "                               'initiatives': 1,\n",
       "                               'insists': 4,\n",
       "                               'interjects': 1,\n",
       "                               'introduces': 1,\n",
       "                               'invades': 1,\n",
       "                               'invests': 1,\n",
       "                               'involves': 2,\n",
       "                               'is': 671,\n",
       "                               'joins': 2,\n",
       "                               'keeps': 2,\n",
       "                               'knows': 4,\n",
       "                               'lacks': 2,\n",
       "                               'lapses': 1,\n",
       "                               'leaves': 3,\n",
       "                               'lives': 2,\n",
       "                               'looks': 1,\n",
       "                               'loses': 1,\n",
       "                               'makes': 11,\n",
       "                               'manages': 1,\n",
       "                               'mandates': 1,\n",
       "                               'markets': 1,\n",
       "                               'marks': 2,\n",
       "                               'matters': 1,\n",
       "                               'means': 5,\n",
       "                               'measures': 2,\n",
       "                               'meets': 1,\n",
       "                               'mimics': 1,\n",
       "                               'mirrors': 1,\n",
       "                               'moves': 1,\n",
       "                               'needs': 4,\n",
       "                               'notes': 3,\n",
       "                               'occurs': 2,\n",
       "                               'offers': 5,\n",
       "                               'opens': 1,\n",
       "                               'operates': 7,\n",
       "                               'opposes': 1,\n",
       "                               'orders': 1,\n",
       "                               'outranks': 1,\n",
       "                               'outstrips': 1,\n",
       "                               'owns': 18,\n",
       "                               'parallels': 1,\n",
       "                               'perceives': 1,\n",
       "                               'permits': 1,\n",
       "                               'perpetuates': 1,\n",
       "                               'picks': 1,\n",
       "                               'pins': 1,\n",
       "                               'pitches': 1,\n",
       "                               'places': 1,\n",
       "                               'plans': 18,\n",
       "                               'plays': 2,\n",
       "                               'points': 1,\n",
       "                               'posts': 1,\n",
       "                               'precedes': 1,\n",
       "                               'predicts': 1,\n",
       "                               'presumes': 1,\n",
       "                               'prevents': 2,\n",
       "                               'produces': 1,\n",
       "                               'prohibits': 3,\n",
       "                               'projects': 1,\n",
       "                               'promises': 2,\n",
       "                               'prompts': 1,\n",
       "                               'propagandizes': 1,\n",
       "                               'proscribes': 1,\n",
       "                               'protects': 1,\n",
       "                               'provides': 8,\n",
       "                               'publishes': 3,\n",
       "                               'purrs': 1,\n",
       "                               'pushes': 1,\n",
       "                               'puts': 2,\n",
       "                               'quips': 1,\n",
       "                               'raises': 5,\n",
       "                               'rates': 1,\n",
       "                               'reaches': 1,\n",
       "                               'reasons': 1,\n",
       "                               'reasserts': 1,\n",
       "                               'recalls': 1,\n",
       "                               'receives': 1,\n",
       "                               'reflects': 4,\n",
       "                               'refuses': 1,\n",
       "                               'relies': 2,\n",
       "                               'remains': 13,\n",
       "                               'repeals': 1,\n",
       "                               'replies': 1,\n",
       "                               'reports': 2,\n",
       "                               'represents': 4,\n",
       "                               'requires': 6,\n",
       "                               'resembles': 1,\n",
       "                               'resists': 1,\n",
       "                               'responds': 1,\n",
       "                               'restricts': 1,\n",
       "                               'restructures': 1,\n",
       "                               'resumes': 1,\n",
       "                               'retires': 1,\n",
       "                               'returns': 1,\n",
       "                               'revolves': 1,\n",
       "                               'rings': 1,\n",
       "                               'routes': 1,\n",
       "                               'runs': 9,\n",
       "                               'sanctions': 1,\n",
       "                               'says': 210,\n",
       "                               'scans': 1,\n",
       "                               'scoffs': 1,\n",
       "                               'seeks': 4,\n",
       "                               'seems': 8,\n",
       "                               'sees': 2,\n",
       "                               'sells': 8,\n",
       "                               'sends': 1,\n",
       "                               'serves': 1,\n",
       "                               'sets': 2,\n",
       "                               'shows': 7,\n",
       "                               'shrinks': 2,\n",
       "                               'signals': 2,\n",
       "                               'simulates': 1,\n",
       "                               'slides': 1,\n",
       "                               'sounds': 1,\n",
       "                               'speaks': 2,\n",
       "                               'specializes': 2,\n",
       "                               'spends': 2,\n",
       "                               'spurns': 1,\n",
       "                               'stands': 3,\n",
       "                               'starts': 2,\n",
       "                               'states': 2,\n",
       "                               'stays': 1,\n",
       "                               'steps': 1,\n",
       "                               'stresses': 1,\n",
       "                               'succeeds': 2,\n",
       "                               'suggests': 7,\n",
       "                               'supplies': 2,\n",
       "                               'supports': 1,\n",
       "                               'suspects': 1,\n",
       "                               'takes': 10,\n",
       "                               'talks': 2,\n",
       "                               'targets': 2,\n",
       "                               'teaches': 1,\n",
       "                               'tells': 4,\n",
       "                               'tempts': 1,\n",
       "                               'thinks': 3,\n",
       "                               'threatens': 1,\n",
       "                               'throws': 2,\n",
       "                               'tracks': 2,\n",
       "                               'trades': 2,\n",
       "                               'transfers': 1,\n",
       "                               'treats': 1,\n",
       "                               'turns': 3,\n",
       "                               'understands': 1,\n",
       "                               'uses': 4,\n",
       "                               'values': 1,\n",
       "                               'views': 1,\n",
       "                               'wants': 14,\n",
       "                               'warns': 1,\n",
       "                               'warrants': 1,\n",
       "                               'wears': 1,\n",
       "                               'wins': 1,\n",
       "                               'works': 2,\n",
       "                               'worries': 2}),\n",
       "                     'WDT': FreqDist({'THAT': 1,\n",
       "                               'That': 2,\n",
       "                               'that': 214,\n",
       "                               'what': 3,\n",
       "                               'which': 224,\n",
       "                               'whichever': 1}),\n",
       "                     'WP': FreqDist({'What': 19,\n",
       "                               'Who': 4,\n",
       "                               'what': 49,\n",
       "                               'who': 163,\n",
       "                               'whom': 6}),\n",
       "                     'WP$': FreqDist({'whose': 14}),\n",
       "                     'WRB': FreqDist({'How': 3,\n",
       "                               'When': 21,\n",
       "                               'Where': 2,\n",
       "                               'Why': 6,\n",
       "                               'how': 25,\n",
       "                               'when': 77,\n",
       "                               'whenever': 1,\n",
       "                               'where': 34,\n",
       "                               'whereby': 1,\n",
       "                               'why': 8}),\n",
       "                     '``': FreqDist({'`': 10, '``': 702})})"
      ]
     },
     "execution_count": 87,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "cfd2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 86,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['named',\n",
       " 'used',\n",
       " 'caused',\n",
       " 'exposed',\n",
       " 'reported',\n",
       " 'replaced',\n",
       " 'sold',\n",
       " 'died',\n",
       " 'expected',\n",
       " 'diagnosed',\n",
       " 'studied',\n",
       " 'industrialized',\n",
       " 'owned',\n",
       " 'found',\n",
       " 'classified',\n",
       " 'rejected',\n",
       " 'outlawed',\n",
       " 'imported',\n",
       " 'tracked',\n",
       " 'thought',\n",
       " 'considered',\n",
       " 'elected',\n",
       " 'based',\n",
       " 'lifted',\n",
       " 'ensnarled',\n",
       " 'voted',\n",
       " 'been',\n",
       " 'held',\n",
       " 'banned',\n",
       " 'renovated',\n",
       " 'prolonged',\n",
       " 'recorded',\n",
       " 'accumulated',\n",
       " 'offered',\n",
       " 'become',\n",
       " 'guaranteed',\n",
       " 'proposed',\n",
       " 'related',\n",
       " 'improved',\n",
       " 'worried',\n",
       " 'cluttered',\n",
       " 'expedited',\n",
       " 'retired',\n",
       " 'ordered',\n",
       " 'collected',\n",
       " 'required',\n",
       " 'received',\n",
       " 'moved',\n",
       " 'determined',\n",
       " 'made',\n",
       " 'changed',\n",
       " 'completed',\n",
       " 'disputed',\n",
       " 'refunded',\n",
       " 'estimated',\n",
       " 'compared',\n",
       " 'located',\n",
       " 'filed',\n",
       " 'scrapped',\n",
       " 'anticipated',\n",
       " 'priced',\n",
       " 'set',\n",
       " 'applied',\n",
       " 'existed',\n",
       " 'incurred',\n",
       " 'reached',\n",
       " 'Regarded',\n",
       " 'paid',\n",
       " 'trained',\n",
       " 'instituted',\n",
       " 'vowed',\n",
       " 'deemed',\n",
       " 'combined',\n",
       " 'removed',\n",
       " 'concerned',\n",
       " 'complained',\n",
       " 'accelerated',\n",
       " 'believed',\n",
       " 'called',\n",
       " 'solved',\n",
       " 'forgiven',\n",
       " 'launched',\n",
       " 'built',\n",
       " 'preferred',\n",
       " 'raised',\n",
       " 'scheduled',\n",
       " 'brought',\n",
       " 'increased',\n",
       " 'developed',\n",
       " 'led',\n",
       " 'approved',\n",
       " 'produced',\n",
       " 'denied',\n",
       " 'requested',\n",
       " 'covered',\n",
       " 'assembled',\n",
       " 'achieved',\n",
       " 'maintained',\n",
       " 'left',\n",
       " 'assisted',\n",
       " 'placed',\n",
       " 'put',\n",
       " 'linked',\n",
       " 'designed',\n",
       " 'boosted',\n",
       " 'issued',\n",
       " 'incorporated',\n",
       " 'advertised',\n",
       " 'announced',\n",
       " 'traded',\n",
       " 'registered',\n",
       " 'ranged',\n",
       " 'capped',\n",
       " 'kicked',\n",
       " 'focused',\n",
       " 'fixed',\n",
       " 'listed',\n",
       " 'turned',\n",
       " 'scrambled',\n",
       " 'outpaced',\n",
       " 'burned',\n",
       " 'clobbered',\n",
       " 'climbed',\n",
       " 'closed',\n",
       " 'skyrocketed',\n",
       " 'surged',\n",
       " 'targeted',\n",
       " 'tied',\n",
       " 'invested',\n",
       " 'jumped',\n",
       " 'alarmed',\n",
       " 'fattened',\n",
       " 'cast',\n",
       " 'repaid',\n",
       " 'permitted',\n",
       " 'crippled',\n",
       " 'lent',\n",
       " 'amended',\n",
       " 'settled',\n",
       " 'manufactured',\n",
       " 'fallen',\n",
       " 'adjusted',\n",
       " 'failed',\n",
       " 'watched',\n",
       " 'intended',\n",
       " 'helped',\n",
       " 'awarded',\n",
       " 'spent',\n",
       " 'provided',\n",
       " 'coupled',\n",
       " 'broken',\n",
       " 'rooted',\n",
       " 'written',\n",
       " 'played',\n",
       " 'welcomed',\n",
       " 'rationed',\n",
       " 'assigned',\n",
       " 'run',\n",
       " 'opened',\n",
       " 'designated',\n",
       " 'carried',\n",
       " 'surveyed',\n",
       " 'confirmed',\n",
       " 'tested',\n",
       " 'had',\n",
       " 'strapped',\n",
       " 'twinned',\n",
       " 'planned',\n",
       " 'operated',\n",
       " 'painted',\n",
       " 'accrued',\n",
       " 'swapped',\n",
       " 'laid',\n",
       " 'obsessed',\n",
       " 'revived',\n",
       " 'prepared',\n",
       " 'romanticized',\n",
       " 'Filmed',\n",
       " 'populated',\n",
       " 'condemned',\n",
       " 'given',\n",
       " 'murdered',\n",
       " 'managed',\n",
       " 'viewed',\n",
       " 'executed',\n",
       " 'presented',\n",
       " 'chopped',\n",
       " 'taken',\n",
       " 'worked',\n",
       " 'speculated',\n",
       " 'come',\n",
       " 'scattered',\n",
       " 'prompted',\n",
       " 'convicted',\n",
       " 'caught',\n",
       " 'Stung',\n",
       " 'opposed',\n",
       " 'refused',\n",
       " 'blamed',\n",
       " 'superimposed',\n",
       " 'nurtured',\n",
       " 'created',\n",
       " 'attracted',\n",
       " 'interrogated',\n",
       " 'accused',\n",
       " 'introduced',\n",
       " 'grown',\n",
       " 'gotten',\n",
       " 'rusted',\n",
       " 'involved',\n",
       " 'responded',\n",
       " 'cleaned',\n",
       " 'dumped',\n",
       " 'quoted',\n",
       " 'asked',\n",
       " 'pursued',\n",
       " 'knitted',\n",
       " 'tripled',\n",
       " 'known',\n",
       " 'spurred',\n",
       " 'seen',\n",
       " 'passed',\n",
       " 'Confronted',\n",
       " 'gone',\n",
       " 'fired',\n",
       " 'prosecuted',\n",
       " 'treated',\n",
       " 'enhanced',\n",
       " 'released',\n",
       " 'inflated',\n",
       " 'surfaced',\n",
       " 'posted',\n",
       " 'educated',\n",
       " 'faded',\n",
       " 'stabbed',\n",
       " 'chosen',\n",
       " 'learned',\n",
       " 'tried',\n",
       " 'discovered',\n",
       " 'dismissed',\n",
       " 'crowded',\n",
       " 'got',\n",
       " 'overused',\n",
       " 'expunged',\n",
       " 'interviewed',\n",
       " 'wanted',\n",
       " 'aimed',\n",
       " 'replicated',\n",
       " 'referred',\n",
       " 'matched',\n",
       " 'measured',\n",
       " 'continued',\n",
       " 'funded',\n",
       " 'threatened',\n",
       " 'embroiled',\n",
       " 'hampered',\n",
       " 'withdrawn',\n",
       " 'assured',\n",
       " 'charged',\n",
       " 'judged',\n",
       " 'polarized',\n",
       " 'Rekindled',\n",
       " 'agreed',\n",
       " 'indicated',\n",
       " 'returned',\n",
       " 'signed',\n",
       " 'acquired',\n",
       " 'associated',\n",
       " 'lost',\n",
       " 'redeemed',\n",
       " 'ended',\n",
       " 'protected',\n",
       " 'argued',\n",
       " 'heard',\n",
       " 'sent',\n",
       " 'alleged',\n",
       " 'retained',\n",
       " 'chaired',\n",
       " 'prohibited',\n",
       " 'initiated',\n",
       " 'mailed',\n",
       " 'obtained',\n",
       " 'relegated',\n",
       " 'employed',\n",
       " 'UPHELD',\n",
       " 'adopted',\n",
       " 'sparked',\n",
       " 'killed',\n",
       " 'appointed',\n",
       " 'exhibited',\n",
       " 'empowered',\n",
       " 'served',\n",
       " 'disclosed',\n",
       " 'accepted',\n",
       " 'fueled',\n",
       " 'decided',\n",
       " 'contacted',\n",
       " 'formed',\n",
       " 'compiled',\n",
       " 'Guaranteed',\n",
       " 'Related',\n",
       " 'positioned',\n",
       " 'buoyed',\n",
       " 'kept',\n",
       " 'locked',\n",
       " 'offset',\n",
       " 'convinced',\n",
       " 'mollified',\n",
       " 'valued',\n",
       " 'rolled',\n",
       " 'Estimated',\n",
       " 'flooded',\n",
       " 'pleased',\n",
       " 'Founded',\n",
       " 'alienated',\n",
       " 'chastised',\n",
       " 'printed',\n",
       " 'portrayed',\n",
       " 'relied',\n",
       " 'recycled',\n",
       " 'Asked',\n",
       " 'scared',\n",
       " 'handled',\n",
       " 'serviced',\n",
       " 'damaged',\n",
       " 'Developed',\n",
       " 'pressed',\n",
       " 'allocated',\n",
       " 'converted',\n",
       " 'mired',\n",
       " 'barred',\n",
       " 'said',\n",
       " 'equipped',\n",
       " 'classed',\n",
       " 'depressed',\n",
       " 'installed',\n",
       " 'met',\n",
       " 'enclosed',\n",
       " 'dropped',\n",
       " 'hit',\n",
       " 'reduced',\n",
       " 'limited',\n",
       " 'perceived',\n",
       " 'rarefied',\n",
       " 'zoomed',\n",
       " 'soared',\n",
       " 'commanded',\n",
       " 'exhausted',\n",
       " 'shipped',\n",
       " 'spread',\n",
       " 'talked',\n",
       " 'excited',\n",
       " 'overpriced',\n",
       " 'forced',\n",
       " 'moderated',\n",
       " 'stated',\n",
       " 'shown',\n",
       " 'described',\n",
       " 'divided',\n",
       " 'declared',\n",
       " 'exercised',\n",
       " 'postponed',\n",
       " 'rescheduled',\n",
       " 'auctioned',\n",
       " 'frozen',\n",
       " 'disappointed',\n",
       " 'eliminated',\n",
       " 'clamped',\n",
       " 'surprised',\n",
       " 'cited',\n",
       " 'subordinated',\n",
       " 'collapsed',\n",
       " 'allowed',\n",
       " 'followed',\n",
       " 'interested',\n",
       " 'purchased',\n",
       " 'escalated',\n",
       " 'stoked',\n",
       " 'publicized',\n",
       " 'identified',\n",
       " 'clarified',\n",
       " 'crossed',\n",
       " 'milked',\n",
       " 'financed',\n",
       " 'integrated',\n",
       " 'performed',\n",
       " 'assumed',\n",
       " 'competed',\n",
       " 'borrowed',\n",
       " 'squeezed',\n",
       " 'switched',\n",
       " 'cultivated',\n",
       " 'tailored',\n",
       " 'troubled',\n",
       " 'triggered',\n",
       " 'needed',\n",
       " 'synchronized',\n",
       " 'expressed',\n",
       " 'done',\n",
       " 'discussed',\n",
       " 'regulated',\n",
       " 'attached',\n",
       " 'rung',\n",
       " 'started',\n",
       " 'muffled',\n",
       " 'absorbed',\n",
       " 'mounted',\n",
       " 'filled',\n",
       " 'fed',\n",
       " 'mixed',\n",
       " 'drawn',\n",
       " 'entered',\n",
       " 'founded',\n",
       " 'remarked',\n",
       " 'observed',\n",
       " 'desired',\n",
       " 'dressed',\n",
       " 'decorated',\n",
       " 'unsettled',\n",
       " 'risen',\n",
       " 'Put',\n",
       " 'sustained',\n",
       " 'tanked',\n",
       " 'renewed',\n",
       " 'invented',\n",
       " 'infringed',\n",
       " 'hired',\n",
       " 'afflicted',\n",
       " 'deteriorated',\n",
       " 'codified',\n",
       " 'gained',\n",
       " 'discarded',\n",
       " 'pointed',\n",
       " 'loaded',\n",
       " 'defined',\n",
       " 'expelled',\n",
       " 'suspended',\n",
       " 'fined',\n",
       " 'represented',\n",
       " 'consented',\n",
       " 'owed',\n",
       " 'Reached',\n",
       " 'rectified',\n",
       " 'noted',\n",
       " 'engaged',\n",
       " 'blocked',\n",
       " 'forgotten',\n",
       " 'tightened',\n",
       " 'reaped',\n",
       " 'stopped',\n",
       " 'pegged',\n",
       " 'backed',\n",
       " 'enacted',\n",
       " 'sought',\n",
       " 'touted',\n",
       " 'faced',\n",
       " 'negotiated',\n",
       " 'Given',\n",
       " 'impressed',\n",
       " 'engineered',\n",
       " 'hurt',\n",
       " 'diversified',\n",
       " 'expanded',\n",
       " 'committed',\n",
       " 'provoked',\n",
       " 'confined',\n",
       " 'stripped',\n",
       " 'reallocated',\n",
       " 'instructed',\n",
       " 'drafted',\n",
       " 'repaired',\n",
       " 'upset',\n",
       " 'altered',\n",
       " 'corrected',\n",
       " 'promised',\n",
       " 'proved',\n",
       " 'understood',\n",
       " 'composed',\n",
       " 'connected',\n",
       " 'regarded',\n",
       " 'robbed',\n",
       " 'deprived',\n",
       " 'organized',\n",
       " 'impaired',\n",
       " 'diminished',\n",
       " 'added',\n",
       " 'advised',\n",
       " 'mentioned',\n",
       " 'answered',\n",
       " 'oriented',\n",
       " 'contributed',\n",
       " 'dominated',\n",
       " 'pushed',\n",
       " 'OFFERED',\n",
       " 'Posted',\n",
       " 'Annualized',\n",
       " 'clashed',\n",
       " 'enjoyed',\n",
       " 'included',\n",
       " 'recruited',\n",
       " 'rumored',\n",
       " 'respected',\n",
       " 'Provided',\n",
       " 'specified',\n",
       " 'predicated',\n",
       " 'endorsed',\n",
       " 'construed',\n",
       " 'supported',\n",
       " 'read',\n",
       " 'contained',\n",
       " 'nominated',\n",
       " 'wasted',\n",
       " 'favored',\n",
       " 'disapproved',\n",
       " 'ratified',\n",
       " 'characterized',\n",
       " 'won',\n",
       " 'entrusted',\n",
       " 'mortgaged',\n",
       " 'reclaimed',\n",
       " 'parched',\n",
       " 'cushioned',\n",
       " 'shut',\n",
       " 'attempted',\n",
       " 'torn',\n",
       " 'staid',\n",
       " 'flirted',\n",
       " 'abandoned',\n",
       " 'stepped',\n",
       " 'headlined',\n",
       " 'secured',\n",
       " 'beleaguered',\n",
       " 'begun',\n",
       " 'plunged',\n",
       " 'missed',\n",
       " 'preapproved',\n",
       " 'upheld',\n",
       " 'accounted',\n",
       " 'vested',\n",
       " 'shaken',\n",
       " 'heated',\n",
       " 'labeled',\n",
       " 'exacerbated',\n",
       " 'wedded',\n",
       " 'headed',\n",
       " 'curbed',\n",
       " 'entrenched',\n",
       " 'stacked',\n",
       " 'frightened',\n",
       " 'automated',\n",
       " 'earned',\n",
       " 'spooked',\n",
       " 'transformed',\n",
       " 'orchestrated',\n",
       " 'gored',\n",
       " 'proven',\n",
       " 'minted',\n",
       " 'beaten',\n",
       " 'practiced',\n",
       " 'implemented',\n",
       " 'feared',\n",
       " 'Left',\n",
       " 'cut',\n",
       " 'appropriated',\n",
       " 'noticed',\n",
       " 'finished',\n",
       " 'documented',\n",
       " 'colored',\n",
       " 'Funded',\n",
       " 'Concerned',\n",
       " 'marketed',\n",
       " 'echoed',\n",
       " 'halted',\n",
       " 'recouped',\n",
       " 'hunted',\n",
       " 'cooled',\n",
       " 'overcome',\n",
       " 'terminated',\n",
       " 'Rated',\n",
       " 'insured',\n",
       " 'rated',\n",
       " 'looked',\n",
       " 'justified',\n",
       " 'discontinued',\n",
       " 'lowered',\n",
       " 'warned',\n",
       " 'structured',\n",
       " 'generated',\n",
       " 'overstated',\n",
       " 'midsized',\n",
       " 'assessed',\n",
       " 'chilled',\n",
       " 'hidden',\n",
       " 'inserted',\n",
       " 'harmed',\n",
       " 'stressed',\n",
       " 'selected',\n",
       " 'directed',\n",
       " 'stimulated',\n",
       " 'bolstered',\n",
       " 'overdone',\n",
       " 'calculated',\n",
       " 'Named',\n",
       " 'revised',\n",
       " 'attributed',\n",
       " 'conducted',\n",
       " 'snapped',\n",
       " 'polled',\n",
       " 'topped',\n",
       " 'outdistanced',\n",
       " 'relaunched',\n",
       " 'restructured',\n",
       " 'repriced',\n",
       " 'concluded',\n",
       " 'hailed',\n",
       " 'despised',\n",
       " 'heightened',\n",
       " 'Used',\n",
       " 'nullified',\n",
       " 'puzzled',\n",
       " 'bought',\n",
       " 'notified',\n",
       " 'merged',\n",
       " 'delisted',\n",
       " 'meant',\n",
       " 'own',\n",
       " 'tendered',\n",
       " 'singled',\n",
       " 'granted',\n",
       " 'felt',\n",
       " 'confused',\n",
       " 'complicated',\n",
       " 'muted',\n",
       " 'Continued',\n",
       " 'split',\n",
       " 'diluted',\n",
       " 'magnified',\n",
       " 'reimbursed',\n",
       " 'subdued',\n",
       " 'controlled',\n",
       " 'liquidated',\n",
       " 'distributed',\n",
       " 'experienced',\n",
       " 'customized',\n",
       " 'extended',\n",
       " 'sweetened',\n",
       " 'derived',\n",
       " 'averted',\n",
       " 'slated',\n",
       " 'delivered',\n",
       " 'capitalized',\n",
       " 'examined',\n",
       " 'reorganized',\n",
       " 'plagued',\n",
       " 'imposed',\n",
       " 'armed',\n",
       " 'rigged',\n",
       " 'subpoenaed',\n",
       " 'planted',\n",
       " 'told',\n",
       " 'centralized',\n",
       " 'resulted',\n",
       " 'forecast',\n",
       " 'fizzled',\n",
       " 'edged',\n",
       " 'battered',\n",
       " 'floated',\n",
       " 'spun',\n",
       " 'licensed',\n",
       " 'qualified',\n",
       " 'specialized',\n",
       " 'trimmed',\n",
       " 'detailed',\n",
       " 'born',\n",
       " 'fashioned',\n",
       " 'bribed',\n",
       " 'arrested',\n",
       " 'Absorbed',\n",
       " 'finalized',\n",
       " 'dashed',\n",
       " 'omitted',\n",
       " 'harvested',\n",
       " 'slowed',\n",
       " 'depleted',\n",
       " 'obligated',\n",
       " 'compressed',\n",
       " 'delayed',\n",
       " 'influenced',\n",
       " 'reflected',\n",
       " 'advanced',\n",
       " 'coated',\n",
       " 'shared']"
      ]
     },
     "execution_count": 86,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "list(cfd2['VBN'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 93,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "cfd1 = nltk.ConditionalFreqDist(wsj)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 94,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['named',\n",
       " 'used',\n",
       " 'caused',\n",
       " 'reported',\n",
       " 'said',\n",
       " 'stopped',\n",
       " 'heard',\n",
       " 'studied',\n",
       " 'led',\n",
       " 'replaced',\n",
       " 'sold',\n",
       " 'worked',\n",
       " 'died',\n",
       " 'found',\n",
       " 'rejected',\n",
       " 'imposed',\n",
       " 'made',\n",
       " 'dumped',\n",
       " 'imported',\n",
       " 'mixed',\n",
       " 'described',\n",
       " 'continued',\n",
       " 'ended',\n",
       " 'thought',\n",
       " 'reached',\n",
       " 'had',\n",
       " 'approved',\n",
       " 'completed',\n",
       " 'suspended',\n",
       " 'lifted',\n",
       " 'dropped',\n",
       " 'voted',\n",
       " 'settled',\n",
       " 'decided',\n",
       " 'followed',\n",
       " 'welcomed',\n",
       " 'held',\n",
       " 'banned',\n",
       " 'pointed',\n",
       " 'squeezed',\n",
       " 'fed',\n",
       " 'registered',\n",
       " 'released',\n",
       " 'increased',\n",
       " 'forecast',\n",
       " 'recorded',\n",
       " 'announced',\n",
       " 'offered',\n",
       " 'lowered',\n",
       " 'spent',\n",
       " 'proposed',\n",
       " 'got',\n",
       " 'added',\n",
       " 'noted',\n",
       " 'turned',\n",
       " 'closed',\n",
       " 'retired',\n",
       " 'ordered',\n",
       " 'required',\n",
       " 'received',\n",
       " 'moved',\n",
       " 'determined',\n",
       " 'changed',\n",
       " 'upheld',\n",
       " 'set',\n",
       " 'estimated',\n",
       " 'compared',\n",
       " 'opened',\n",
       " 'tied',\n",
       " 'filed',\n",
       " 'disclosed',\n",
       " 'anticipated',\n",
       " 'attached',\n",
       " 'called',\n",
       " 'applied',\n",
       " 'favored',\n",
       " 'posted',\n",
       " 'paid',\n",
       " 'removed',\n",
       " 'accelerated',\n",
       " 'placed',\n",
       " 'vowed',\n",
       " 'deemed',\n",
       " 'prompted',\n",
       " 'complained',\n",
       " 'believed',\n",
       " 'met',\n",
       " 'solved',\n",
       " 'launched',\n",
       " 'built',\n",
       " 'triggered',\n",
       " 'developed',\n",
       " 'entered',\n",
       " 'acquired',\n",
       " 'preferred',\n",
       " 'raised',\n",
       " 'scheduled',\n",
       " 'brought',\n",
       " 'started',\n",
       " 'produced',\n",
       " 'denied',\n",
       " 'covered',\n",
       " 'maintained',\n",
       " 'left',\n",
       " 'cut',\n",
       " 'bought',\n",
       " 'snapped',\n",
       " 'put',\n",
       " 'boosted',\n",
       " 'issued',\n",
       " 'agreed',\n",
       " 'surged',\n",
       " 'ranged',\n",
       " 'kicked',\n",
       " 'scrambled',\n",
       " 'plunged',\n",
       " 'climbed',\n",
       " 'invested',\n",
       " 'jumped',\n",
       " 'owed',\n",
       " 'lent',\n",
       " 'stressed',\n",
       " 'failed',\n",
       " 'indicated',\n",
       " 'asked',\n",
       " 'intended',\n",
       " 'helped',\n",
       " 'awarded',\n",
       " 'purchased',\n",
       " 'provided',\n",
       " 'polled',\n",
       " 'included',\n",
       " 'blamed',\n",
       " 'contributed',\n",
       " 'read',\n",
       " 'fired',\n",
       " 'committed',\n",
       " 'learned',\n",
       " 'carried',\n",
       " 'identified',\n",
       " 'endorsed',\n",
       " 'renewed',\n",
       " 'confirmed',\n",
       " 'terminated',\n",
       " 'planned',\n",
       " 'contained',\n",
       " 'condemned',\n",
       " 'managed',\n",
       " 'viewed',\n",
       " 'needed',\n",
       " 'killed',\n",
       " 'presented',\n",
       " 'speculated',\n",
       " 'hit',\n",
       " 'opposed',\n",
       " 'refused',\n",
       " 'wanted',\n",
       " 'created',\n",
       " 'introduced',\n",
       " 'accused',\n",
       " 'tried',\n",
       " 'involved',\n",
       " 'responded',\n",
       " 'quoted',\n",
       " 'tripled',\n",
       " 'passed',\n",
       " 'matched',\n",
       " 'won',\n",
       " 'treated',\n",
       " 'alleged',\n",
       " 'concluded',\n",
       " 'surfaced',\n",
       " 'restructured',\n",
       " 'advised',\n",
       " 'told',\n",
       " 'feared',\n",
       " 'meant',\n",
       " 'returned',\n",
       " 'advanced',\n",
       " 'discovered',\n",
       " 'dismissed',\n",
       " 'allowed',\n",
       " 'aimed',\n",
       " 'referred',\n",
       " 'represented',\n",
       " 'threatened',\n",
       " 'controlled',\n",
       " 'hampered',\n",
       " 'nominated',\n",
       " 'assured',\n",
       " 'damaged',\n",
       " 'gained',\n",
       " 'merged',\n",
       " 'signed',\n",
       " 'lost',\n",
       " 'argued',\n",
       " 'sent',\n",
       " 'formed',\n",
       " 'obtained',\n",
       " 'mounted',\n",
       " 'adopted',\n",
       " 'sparked',\n",
       " 'served',\n",
       " 'understood',\n",
       " 'accepted',\n",
       " 'fueled',\n",
       " 'limited',\n",
       " 'Asked',\n",
       " 'extended',\n",
       " 'kept',\n",
       " 'rolled',\n",
       " 'chastised',\n",
       " 'printed',\n",
       " 'expanded',\n",
       " 'sweetened',\n",
       " 'barred',\n",
       " 'reduced',\n",
       " 'declared',\n",
       " 'soared',\n",
       " 'remarked',\n",
       " 'forced',\n",
       " 'stated',\n",
       " 'finished',\n",
       " 'eliminated',\n",
       " 'cited',\n",
       " 'collapsed',\n",
       " 'earned',\n",
       " 'licensed',\n",
       " 'secured',\n",
       " 'omitted',\n",
       " 'assumed',\n",
       " 'stepped',\n",
       " 'switched',\n",
       " 'felt',\n",
       " 'expressed',\n",
       " 'discussed',\n",
       " 'invented',\n",
       " 'observed',\n",
       " 'hired',\n",
       " 'expelled',\n",
       " 'consented',\n",
       " 'backed',\n",
       " 'reflected',\n",
       " 'sought',\n",
       " 'negotiated',\n",
       " 'resulted',\n",
       " 'proved',\n",
       " 'examined',\n",
       " 'dominated',\n",
       " 'pushed',\n",
       " 'supported',\n",
       " 'attributed',\n",
       " 'attempted',\n",
       " 'obligated',\n",
       " 'halted',\n",
       " 'transformed',\n",
       " 'marketed',\n",
       " 'rated',\n",
       " 'warned',\n",
       " 'edged',\n",
       " 'bribed']"
      ]
     },
     "execution_count": 94,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "[w for w in cfd1.conditions() if 'VBD' in cfd1[w] and 'VBN' in cfd1[w]]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 95,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "idx1 = wsj.index(('kicked', 'VBD'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 96,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('While', 'IN'),\n",
       " ('program', 'NN'),\n",
       " ('trades', 'NNS'),\n",
       " ('swiftly', 'RB'),\n",
       " ('kicked', 'VBD')]"
      ]
     },
     "execution_count": 96,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "wsj[idx1-4:idx1+1]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 97,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "idx2 = wsj.index(('kicked', 'VBN'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 98,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('head', 'NN'),\n",
       " ('of', 'IN'),\n",
       " ('state', 'NN'),\n",
       " ('has', 'VBZ'),\n",
       " ('kicked', 'VBN')]"
      ]
     },
     "execution_count": 98,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "wsj[idx2-4:idx2+1]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 99,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "def findtags(tag_prefix, tagged_text):\n",
    "    cfd = nltk.ConditionalFreqDist((tag, word) for (word, tag) in tagged_text if tag.startswith(tag_prefix))\n",
    "    return dict((tag, cfd[tag].most_common(5)) for tag in cfd.conditions())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 100,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "tagdict = findtags('NN', nltk.corpus.brown.tagged_words(categories='news'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 102,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "NN [('year', 137), ('time', 97), ('state', 88), ('week', 85), ('man', 72)]\n",
      "NN$ [(\"year's\", 13), (\"world's\", 8), (\"state's\", 7), (\"nation's\", 6), (\"city's\", 6)]\n",
      "NN$-HL [(\"Golf's\", 1), (\"Navy's\", 1)]\n",
      "NN$-TL [(\"President's\", 11), (\"Administration's\", 3), (\"Army's\", 3), (\"League's\", 3), (\"University's\", 3)]\n",
      "NN-HL [('sp.', 2), ('problem', 2), ('Question', 2), ('cut', 2), ('party', 2)]\n",
      "NN-NC [('ova', 1), ('eva', 1), ('aya', 1)]\n",
      "NN-TL [('President', 88), ('House', 68), ('State', 59), ('University', 42), ('City', 41)]\n",
      "NN-TL-HL [('Fort', 2), ('Mayor', 1), ('Commissioner', 1), ('City', 1), ('Oak', 1)]\n",
      "NNS [('years', 101), ('members', 69), ('people', 52), ('sales', 51), ('men', 46)]\n",
      "NNS$ [(\"children's\", 7), (\"women's\", 5), (\"men's\", 3), (\"janitors'\", 3), (\"taxpayers'\", 2)]\n",
      "NNS$-HL [(\"Dealers'\", 1), (\"Idols'\", 1)]\n",
      "NNS$-TL [(\"Women's\", 4), (\"States'\", 3), (\"Giants'\", 2), (\"Princes'\", 1), (\"Bombers'\", 1)]\n",
      "NNS-HL [('Wards', 1), ('deputies', 1), ('bonds', 1), ('aspects', 1), ('Decisions', 1)]\n",
      "NNS-TL [('States', 38), ('Nations', 11), ('Masters', 10), ('Communists', 9), ('Rules', 9)]\n",
      "NNS-TL-HL [('Nations', 1)]\n"
     ]
    }
   ],
   "source": [
    "for tag in sorted(tagdict):\n",
    "    print(tag, tagdict[tag])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 104,
   "metadata": {},
   "outputs": [],
   "source": [
    "brown_learned_text = brown.words(categories='learned')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 105,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[',',\n",
       " '.',\n",
       " 'accomplished',\n",
       " 'analytically',\n",
       " 'appear',\n",
       " 'apt',\n",
       " 'associated',\n",
       " 'assuming',\n",
       " 'became',\n",
       " 'become',\n",
       " 'been',\n",
       " 'began',\n",
       " 'call',\n",
       " 'called',\n",
       " 'carefully',\n",
       " 'chose',\n",
       " 'classified',\n",
       " 'colorful',\n",
       " 'composed',\n",
       " 'contain',\n",
       " 'differed',\n",
       " 'difficult',\n",
       " 'encountered',\n",
       " 'enough',\n",
       " 'equate',\n",
       " 'extremely',\n",
       " 'found',\n",
       " 'happens',\n",
       " 'have',\n",
       " 'ignored',\n",
       " 'in',\n",
       " 'involved',\n",
       " 'more',\n",
       " 'needed',\n",
       " 'nightly',\n",
       " 'observed',\n",
       " 'of',\n",
       " 'on',\n",
       " 'out',\n",
       " 'quite',\n",
       " 'represent',\n",
       " 'responsible',\n",
       " 'revamped',\n",
       " 'seclude',\n",
       " 'set',\n",
       " 'shortened',\n",
       " 'sing',\n",
       " 'sounded',\n",
       " 'stated',\n",
       " 'still',\n",
       " 'sung',\n",
       " 'supported',\n",
       " 'than',\n",
       " 'to',\n",
       " 'when',\n",
       " 'work']"
      ]
     },
     "execution_count": 105,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "sorted(set(b for (a, b) in nltk.bigrams(brown_learned_text) if a == 'often'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 106,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "brown_lrnd_tagged = brown.tagged_words(categories='learned', tagset='universal')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 108,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "tags = [b[1] for (a, b) in nltk.bigrams(brown_lrnd_tagged) if a[0] == 'often']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 109,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "fd = nltk.FreqDist(tags)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 110,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "VERB  ADV  ADP  ADJ    .  PRT \n",
      "  37    8    7    6    4    2 \n"
     ]
    }
   ],
   "source": [
    "fd.tabulate()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 111,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# 搜索 动词词组 verb to verb\n",
    "def process(sentence):\n",
    "    for (w1, t1), (w2, t2), (w3, t3) in nltk.trigrams(sentence):\n",
    "        if (t1.startswith('V') and t2 == 'TO' and t3.startswith('V')):\n",
    "            print(w1, w2, w3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 112,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "combined to achieve\n",
      "continue to place\n",
      "serve to protect\n",
      "wanted to wait\n",
      "allowed to place\n",
      "expected to become\n",
      "expected to approve\n",
      "expected to make\n",
      "intends to make\n",
      "seek to set\n",
      "like to see\n",
      "designed to provide\n",
      "get to hear\n",
      "expects to tell\n",
      "expected to give\n",
      "prefer to pay\n",
      "required to obtain\n",
      "permitted to teach\n",
      "designed to reduce\n",
      "Asked to elaborate\n",
      "got to go\n",
      "raised to pay\n",
      "scheduled to go\n",
      "cut to meet\n",
      "needed to meet\n",
      "hastened to add\n",
      "found to prevent\n",
      "continue to insist\n",
      "compelled to make\n",
      "made to remove\n",
      "revamped to give\n",
      "want to risk\n",
      "appear to spark\n",
      "fails to consider\n",
      "plans to call\n",
      "going to examine\n",
      "plans to name\n",
      "come to pass\n",
      "voted to accept\n",
      "happens to hold\n",
      "authorized to adopt\n",
      "hesitated to prosecute\n",
      "try to make\n",
      "decided to spend\n",
      "taken to preserve\n",
      "left to preserve\n",
      "stand to bring\n",
      "decided to seek\n",
      "trying to induce\n",
      "proposing to make\n",
      "decided to run\n",
      "directed to investigate\n",
      "expected to pass\n",
      "expected to make\n",
      "expected to encounter\n",
      "hopes to pass\n",
      "came to pay\n",
      "expected to receive\n",
      "understood to follow\n",
      "wanted to vote\n",
      "decide to call\n",
      "begin to flow\n",
      "appears to face\n",
      "fails to pass\n",
      "care to acknowledge\n",
      "like to convey\n",
      "continued to wage\n",
      "try to avoid\n",
      "done to arouse\n",
      "tried to economize\n",
      "agreed to cooperate\n",
      "want to find\n",
      "expected to raise\n",
      "agreed to form\n",
      "threatened to form\n",
      "failed to sign\n",
      "trying to build\n",
      "plan to absorb\n",
      "working to establish\n",
      "expects to evacuate\n",
      "need to hear\n",
      "scheduled to hold\n",
      "decided to ask\n",
      "scheduled to fill\n",
      "going to determine\n",
      "urged to move\n",
      "conpired to use\n",
      "used to carry\n",
      "needed to face\n",
      "failed to tally\n",
      "failed to produce\n",
      "tried to stretch\n",
      "hopes to melt\n",
      "slated to oppose\n",
      "scheduled to share\n",
      "plans to bring\n",
      "seek to trim\n",
      "seems to improve\n",
      "appeared to win\n",
      "gets to play\n",
      "hopes to start\n",
      "tried to teach\n",
      "seem to get\n",
      "started to form\n",
      "like to keep\n",
      "want to talk\n",
      "continue to abide\n",
      "refused to reconsider\n",
      "expected to put\n",
      "resigned to take\n",
      "sought to convince\n",
      "tried to blast\n",
      "tried to keep\n",
      "happened to think\n",
      "expected to continue\n",
      "plans to open\n",
      "recovering to make\n",
      "supposed to deliver\n",
      "get to like\n",
      "want to thank\n",
      "set to play\n",
      "going to pass\n",
      "paid to play\n",
      "wanted to pop\n",
      "expect to establish\n",
      "going to try\n",
      "try to get\n",
      "signed to play\n",
      "fly to collect\n",
      "helps to bridge\n",
      "wants to pick\n",
      "relearns to mingle\n",
      "watching to see\n",
      "learn to readjust\n",
      "promises to follow\n",
      "expect to offer\n",
      "like to come\n",
      "like to bring\n",
      "combined to form\n",
      "chosen to rule\n",
      "attempted to stop\n",
      "required to use\n",
      "prepared to grant\n",
      "refused to return\n",
      "demanded to know\n",
      "decided to end\n",
      "offered to supply\n",
      "designed to seek\n",
      "get to know\n",
      "get to know\n",
      "going to call\n",
      "attempted to end\n",
      "forbidden to drive\n",
      "failed to reach\n",
      "wish to appear\n",
      "hopes to rebuild\n",
      "used to provide\n",
      "wanted to make\n",
      "trying to land\n",
      "prepared to accept\n",
      "continue to operate\n",
      "taken to overcome\n",
      "intend to make\n",
      "desiring to study\n",
      "designed to assure\n",
      "intend to attend\n",
      "failed to cooperate\n",
      "agree to attend\n",
      "decided to attend\n",
      "scheduled to begin\n",
      "agreed to meet\n",
      "failed to show\n",
      "declined to name\n",
      "tried to subdue\n",
      "planning to expand\n",
      "thought to infest\n",
      "voted to decertify\n",
      "designed to give\n",
      "continued to run\n",
      "failed to place\n",
      "started to turn\n",
      "bought to provide\n",
      "asked to set\n",
      "vote to appeal\n",
      "failed to reach\n",
      "failed to destroy\n",
      "encouraged to try\n",
      "try to get\n",
      "managed to maneuver\n",
      "obligated to make\n",
      "promised to get\n",
      "attempting to connect\n",
      "prepared to answer\n",
      "failed to report\n",
      "attempted to cash\n",
      "wanting to get\n",
      "combined to make\n",
      "continue to grab\n",
      "designed to provide\n",
      "appear to favor\n",
      "declined to suggest\n",
      "expected to advance\n",
      "required to reach\n",
      "fail to give\n",
      "began to come\n",
      "undertake to reply\n",
      "found to deal\n",
      "forced to buy\n",
      "starting to get\n",
      "inclined to explain\n",
      "supposed to look\n",
      "chose to take\n",
      "used to emphasize\n",
      "seem to realize\n",
      "happen to grow\n",
      "tried to compromise\n",
      "scheduled to arrive\n",
      "prefer to see\n",
      "set to open\n",
      "expected to prove\n",
      "try to influence\n",
      "strive to set\n",
      "decided to try\n",
      "try to let\n",
      "asked to read\n",
      "prepared to demonstrate\n",
      "led to believe\n",
      "went to see\n",
      "begun to pall\n",
      "going to get\n",
      "painted to match\n",
      "appointed to serve\n",
      "expected to register\n",
      "failed to materialize\n",
      "wanted to buy\n",
      "begin to implement\n",
      "tended to confirm\n",
      "want to appear\n",
      "try to probe\n",
      "determined to apply\n",
      "come to warn\n",
      "known to rely\n",
      "try to exploit\n",
      "tended to cancel\n",
      "cease to marvel\n",
      "seem to represent\n",
      "seems to show\n",
      "declines to gamble\n",
      "needs to feel\n",
      "advanced to argue\n",
      "undertakes to fight\n",
      "decided to keep\n",
      "advertising to attract\n",
      "wants to operate\n",
      "varied to provide\n",
      "designed to reduce\n",
      "use to deny\n",
      "combining to lower\n",
      "combining to raise\n",
      "intended to effect\n",
      "tend to convert\n",
      "exist to raise\n",
      "wish to prevent\n",
      "wish to preserve\n",
      "attempting to extend\n",
      "made to take\n",
      "continue to set\n",
      "trying to persuade\n",
      "attempted to take\n",
      "decided to break\n",
      "braced to move\n",
      "needed to keep\n",
      "used to carry\n",
      "decided to go\n",
      "happens to benefit\n",
      "attempted to work\n",
      "decided to join\n",
      "said to regard\n",
      "sought to bring\n",
      "want to give\n",
      "voting to cut\n",
      "prepared to choke\n",
      "used to approach\n",
      "trying to hit\n",
      "refused to let\n",
      "began to acquire\n",
      "proceeded to sink\n",
      "proceeded to follow\n",
      "hoping to slice\n",
      "chose to hit\n",
      "like to hit\n",
      "tries to answer\n",
      "want to talk\n",
      "got to get\n",
      "used to follow\n",
      "try to play\n",
      "conspired to lose\n",
      "needed to revive\n",
      "chosen to run\n",
      "hopes to visit\n",
      "got to see\n",
      "arranged to sell\n",
      "delighted to get\n",
      "want to enjoy\n",
      "tried to get\n",
      "try to close\n",
      "required to furnish\n",
      "obliged to dole\n",
      "wished to wait\n",
      "decided to act\n",
      "hoped to attend\n",
      "like to woo\n",
      "prepared to discuss\n",
      "wanted to go\n",
      "allowed to file\n",
      "tried to persuade\n",
      "began to tell\n",
      "hoped to peddle\n",
      "intended to insure\n",
      "decided to provide\n",
      "expected to go\n",
      "expected to sign\n",
      "like to eat\n",
      "like to talk\n",
      "ceased to grumble\n",
      "tending to bid\n",
      "start to pay\n",
      "failed to measure\n",
      "going to take\n",
      "needed to push\n",
      "trying to get\n",
      "try to get\n",
      "want to increase\n",
      "wants to bring\n",
      "threaten to strike\n",
      "begun to grow\n",
      "combine to serve\n",
      "helping to strengthen\n",
      "designed to promote\n",
      "threatening to expand\n",
      "seeks to get\n",
      "begin to see\n",
      "continue to expand\n",
      "failing to render\n",
      "decided to tackle\n",
      "expects to sign\n",
      "tends to become\n",
      "came to understand\n",
      "deserve to breathe\n",
      "advised to seek\n",
      "attempting to make\n",
      "try to gun\n",
      "began to fill\n",
      "proposes to preserve\n",
      "asked to approve\n",
      "seeking to break\n",
      "tends to spread\n",
      "want to amend\n",
      "rejected to seek\n",
      "continued to speak\n",
      "trying to make\n",
      "expected to head\n",
      "tempted to let\n",
      "appear to cost\n",
      "attempt to shore\n",
      "seeking to achieve\n",
      "expected to report\n",
      "born to play\n",
      "promising to build\n",
      "minded to read\n",
      "hope to win\n",
      "threatened to ignite\n",
      "beginning to take\n",
      "flew to exert\n",
      "proceed to validate\n",
      "continues to feel\n",
      "want to make\n",
      "going to get\n",
      "attempt to rewrite\n",
      "purport to advocate\n",
      "seeking to capitalize\n",
      "exist to aid\n",
      "learn to put\n",
      "tends to create\n",
      "promised to eat\n",
      "hopes to include\n",
      "moving to create\n",
      "prepared to undertake\n",
      "conspired to overthrow\n",
      "seem to feel\n",
      "decided to keep\n",
      "applied to serve\n",
      "try to seize\n",
      "lead to involving\n",
      "cut to allow\n",
      "hope to enjoy\n",
      "likes to receive\n",
      "delighted to learn\n",
      "going to expand\n",
      "authorized to deliver\n",
      "going to can\n",
      "going to close\n",
      "supposed to make\n",
      "try to raise\n",
      "tried to settle\n",
      "pass to enter\n",
      "came to tell\n",
      "wanted to grab\n",
      "stops to think\n",
      "expect to get\n",
      "chosen to answer\n",
      "motivated to seek\n",
      "disposed to covet\n",
      "like to lie\n",
      "going to tell\n",
      "prepared to accept\n",
      "try to stop\n",
      "try to stop\n",
      "sought to break\n",
      "inclined to look\n",
      "begun to act\n",
      "elect to slow\n",
      "like to challenge\n",
      "going to move\n",
      "asked to carry\n",
      "expect to stop\n",
      "expect to reduce\n",
      "expected to supply\n",
      "supposed to win\n",
      "seems to lack\n",
      "tends to treat\n",
      "like to share\n",
      "try to treat\n",
      "try to bring\n",
      "try to give\n",
      "continue to lack\n",
      "learn to color\n",
      "slated to replace\n",
      "strive to put\n",
      "intends to provide\n",
      "try to solve\n",
      "decided to use\n",
      "try to end\n",
      "going to take\n",
      "trying to organize\n",
      "permitted to repair\n",
      "trying to find\n",
      "planned to rival\n",
      "seems to speak\n",
      "tried to dissuade\n",
      "tends to shimmy\n",
      "designed to teach\n",
      "prepared to teach\n",
      "wanted to sign\n",
      "made to act\n",
      "continue to influence\n",
      "begins to notice\n",
      "expected to win\n",
      "seek to find\n",
      "join to defeat\n",
      "meant to repeat\n",
      "trying to downgrade\n",
      "tried to guard\n",
      "want to separate\n",
      "seem to indicate\n",
      "afford to buy\n",
      "try to develop\n",
      "attempting to attract\n",
      "compelled to write\n",
      "failed to set\n",
      "continue to shape\n",
      "wants to study\n",
      "wants to study\n",
      "equipped to care\n",
      "expected to survive\n",
      "shocked to see\n",
      "going to play\n",
      "voted to aid\n",
      "died to uphold\n",
      "urged to reduce\n",
      "wish to state\n",
      "expected to give\n",
      "trying to maintain\n",
      "attempt to seek\n",
      "wishes to commend\n",
      "qualified to teach\n",
      "want to let\n",
      "informed to report\n",
      "planning to shelter\n",
      "plans to sit\n",
      "continue to inquire\n",
      "began to realize\n",
      "refuse to acknowledge\n",
      "required to certify\n",
      "desire to participate\n",
      "hasten to join\n",
      "like to question\n",
      "needed to help\n",
      "prepared to care\n",
      "like to suggest\n",
      "fear to negotiate\n",
      "tried to prevent\n",
      "refusing to pay\n",
      "like to quote\n",
      "transfer to ride\n",
      "managed to automate\n",
      "expected to pay\n",
      "collected to buy\n",
      "continue to provide\n",
      "wish to congratulate\n",
      "help to turn\n",
      "try to keep\n",
      "try to frighten\n",
      "wish to advocate\n",
      "expect to see\n",
      "refuse to aid\n",
      "needs to stand\n",
      "strives to emulate\n",
      "refusing to show\n",
      "seems to match\n",
      "decided to rake\n",
      "entitled to stay\n",
      "bringing to bear\n",
      "beginning to get\n",
      "threaten to use\n",
      "begin to play\n",
      "begin to hunt\n",
      "induced to see\n",
      "going to hang\n",
      "continue to test\n",
      "choose to agree\n",
      "chosen to find\n",
      "compelled to conduct\n",
      "need to realize\n",
      "used to justify\n",
      "fail to respond\n",
      "intends to economize\n",
      "bound to say\n",
      "trying to mollify\n",
      "used to say\n",
      "came to reassert\n",
      "choose to call\n",
      "intend to re-enter\n",
      "conscripted to enact\n",
      "continues to feed\n",
      "tried to integrate\n",
      "poised to strike\n",
      "try to force\n",
      "attempting to reach\n",
      "afford to take\n",
      "forbidden to sit\n",
      "plans to import\n",
      "likes to imagine\n",
      "used to get\n",
      "trying to make\n",
      "ceased to suggest\n",
      "going to work\n",
      "wanting to cut\n",
      "choose to persuade\n",
      "trying to keep\n",
      "like to embark\n",
      "suited to defeat\n",
      "hastened to put\n",
      "like to add\n",
      "want to preserve\n",
      "required to participate\n",
      "happened to save\n",
      "doing to promote\n",
      "tempted to quote\n",
      "continuing to capture\n",
      "need to communicate\n",
      "like to see\n",
      "interested to know\n",
      "allowed to rust\n",
      "chose to devote\n",
      "left to choose\n",
      "want to own\n",
      "plan to become\n",
      "persuaded to restock\n",
      "seems to improve\n",
      "arranged to permit\n",
      "seem to lend\n",
      "allowed to mix\n",
      "starts to swing\n",
      "seems to stop\n",
      "ordered to hold\n",
      "fitted to endure\n",
      "trying to follow\n",
      "threatening to explode\n",
      "rides to break\n",
      "managed to make\n",
      "dancing to display\n",
      "hasten to report\n",
      "seems to come\n",
      "reassuring to see\n",
      "profess to know\n",
      "help to explain\n",
      "forced to rely\n",
      "attempt to homogenize\n",
      "like to put\n",
      "continue to try\n",
      "try to come\n",
      "seem to deal\n",
      "decide to let\n",
      "tries to take\n",
      "trying to forget\n",
      "trying to acquire\n",
      "threatens to linger\n",
      "decided to forego\n",
      "managed to hold\n",
      "intended to illustrate\n",
      "tried to get\n",
      "learn to live\n",
      "helping to move\n",
      "striving to hold\n",
      "choose to work\n",
      "tried to see\n",
      "trying to create\n",
      "made to appear\n",
      "failed to make\n",
      "seemed to deserve\n",
      "managed to mix\n",
      "want to hurt\n",
      "liked to nip\n",
      "manages to acquire\n",
      "widened to enchant\n",
      "serve to contradict\n",
      "dare to experiment\n",
      "tried to humanize\n",
      "tries to preserve\n",
      "helps to rebut\n",
      "seems to make\n",
      "began to play\n",
      "cares to remember\n",
      "serve to show\n",
      "want to collect\n",
      "designed to invite\n",
      "attempt to make\n",
      "designed to belong\n",
      "seem to come\n",
      "wanted to identify\n",
      "neglect to cultivate\n",
      "chooses to lead\n",
      "chosen to sing\n",
      "expected to follow\n",
      "formed to spur\n",
      "tends to shy\n",
      "seeking to become\n",
      "tries to make\n",
      "began to change\n",
      "try to solve\n",
      "formed to fill\n",
      "determined to avoid\n",
      "seems to work\n",
      "began to fall\n",
      "began to depart\n",
      "refused to give\n",
      "like to sniff\n",
      "continue to demonstrate\n",
      "begins to wilt\n",
      "going to murder\n",
      "trying to puzzle\n",
      "expects to profit\n",
      "chooses to die\n",
      "wishes to pay\n",
      "conditioned to expect\n",
      "hoped to tell\n",
      "refusing to make\n",
      "intended to stop\n",
      "failed to lead\n",
      "need to discipline\n",
      "attempts to trace\n",
      "conspire to defy\n",
      "learning to think\n",
      "wants to know\n",
      "wants to supply\n",
      "begin to look\n",
      "start to think\n",
      "attempt to say\n",
      "come to feel\n",
      "supposed to put\n",
      "called to work\n",
      "continue to exist\n",
      "observed to characterize\n",
      "continue to alienate\n",
      "continue to preach\n",
      "means to say\n",
      "fit to place\n",
      "concerned to stand\n",
      "strive to formulate\n",
      "proceeded to give\n",
      "offer to remind\n",
      "offered to allow\n",
      "requested to teach\n",
      "said to repeat\n",
      "mean to say\n",
      "inclined to extenuate\n",
      "came to rescue\n",
      "venture to assert\n",
      "come to destroy\n",
      "compelled to ask\n",
      "begins to look\n",
      "refuse to accept\n",
      "entitled to excoriate\n",
      "come to occupy\n",
      "prepared to resort\n",
      "obliged to become\n",
      "disposed to allow\n",
      "prepared to give\n",
      "trying to continue\n",
      "continue to use\n",
      "attempting to bridge\n",
      "destined to live\n",
      "daring to trust\n",
      "called to stand\n",
      "die to save\n",
      "told to express\n",
      "supposed to perform\n",
      "designed to give\n",
      "fear to negotiate\n",
      "threatening to devour\n",
      "try to escape\n",
      "tried to swim\n",
      "learn to say\n",
      "threatening to eat\n",
      "remains to show\n",
      "attempted to analyze\n",
      "tried to consider\n",
      "begin to talk\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "tended to stifle\n",
      "begin to understand\n",
      "fail to achieve\n",
      "made to keep\n",
      "desiring to unite\n",
      "invited to speak\n",
      "hesitate to ask\n",
      "trying to make\n",
      "help to determine\n",
      "combine to provide\n",
      "attempt to compensate\n",
      "learn to recognize\n",
      "serve to promote\n",
      "claim to incarnate\n",
      "led to emphasize\n",
      "tend to consider\n",
      "expected to seek\n",
      "disposed to compromise\n",
      "served to provide\n",
      "mean to imply\n",
      "mean to imply\n",
      "attempts to face\n",
      "need to submit\n",
      "prepared to run\n",
      "asked to choose\n",
      "continuing to incur\n",
      "seems to think\n",
      "begin to amass\n",
      "sought to limit\n",
      "bring to bear\n",
      "invited to participate\n",
      "sought to bring\n",
      "attempting to explore\n",
      "seen to consist\n",
      "committed to avoid\n",
      "claim to serve\n",
      "determined to avoid\n",
      "trying to converse\n",
      "started to adjust\n",
      "trying to make\n",
      "decided to take\n",
      "forced to conclude\n",
      "beginning to make\n",
      "helped to make\n",
      "made to give\n",
      "determined to exclude\n",
      "sought to win\n",
      "sought to avoid\n",
      "meant to incur\n",
      "supposed to result\n",
      "cited to show\n",
      "supposed to possess\n",
      "burned to make\n",
      "wanted to find\n",
      "helps to meet\n",
      "rejoiced to see\n",
      "began to suspect\n",
      "began to review\n",
      "called to sit\n",
      "began to write\n",
      "decided to try\n",
      "takes to tell\n",
      "seemed to widen\n",
      "proceeded to teach\n",
      "helps to make\n",
      "remember to make\n",
      "supposed to like\n",
      "working to improve\n",
      "like to make\n",
      "added to encourage\n",
      "like to shear\n",
      "needs to tell\n",
      "like to grow\n",
      "allowed to mature\n",
      "used to attack\n",
      "continued to threaten\n",
      "decide to build\n",
      "used to destroy\n",
      "going to develop\n",
      "put to see\n",
      "fail to develop\n",
      "seem to fall\n",
      "serve to emphasize\n",
      "tend to stamp\n",
      "fail to enter\n",
      "rehearing to acquire\n",
      "fail to convey\n",
      "needed to attain\n",
      "seem to reduce\n",
      "continue to show\n",
      "sponsored to win\n",
      "invited to judge\n",
      "asked to pick\n",
      "qualified to judge\n",
      "helping to create\n",
      "qualified to win\n",
      "continuing to donate\n",
      "found to take\n",
      "built to accommodate\n",
      "bothered to make\n",
      "wanted to purchase\n",
      "managing to get\n",
      "formed to develop\n",
      "used to indicate\n",
      "meant to pertain\n",
      "designed to cater\n",
      "equipped to handle\n",
      "pulled to clear\n",
      "Tend to make\n",
      "progresses to insure\n",
      "Endeavor to get\n",
      "used to separate\n",
      "used to separate\n",
      "seems to know\n",
      "wanted to trot\n",
      "likes to trot\n",
      "wants to trot\n",
      "started to pace\n",
      "starting to go\n",
      "expected to race\n",
      "designed to push\n",
      "looks to run\n",
      "began to motor\n",
      "trained to drag\n",
      "fled to make\n",
      "seemed to know\n",
      "used to say\n",
      "preferred to get\n",
      "hope to cover\n",
      "want to miss\n",
      "scheduled to vanish\n",
      "vanish to make\n",
      "continued to live\n",
      "seem to cascade\n",
      "forget to buy\n",
      "fail to shorten\n",
      "intend to cook\n",
      "sized to fit\n",
      "continue to release\n",
      "wish to create\n",
      "trim to fit\n",
      "cut to fit\n",
      "help to prevent\n",
      "designed to take\n",
      "used to transport\n",
      "want to buy\n",
      "used to fasten\n",
      "help to keep\n",
      "needed to build\n",
      "designed to accommodate\n",
      "adjusted to suit\n",
      "used to cut\n",
      "want to avoid\n",
      "agreed to take\n",
      "planned to destroy\n",
      "allowed to issue\n",
      "managed to coerce\n",
      "want to know\n",
      "planning to bring\n",
      "urged to keep\n",
      "come to swim\n",
      "enjoined to look\n",
      "prepared to cope\n",
      "want to make\n",
      "allowed to dry\n",
      "pays to buy\n",
      "want to play\n",
      "expected to last\n",
      "plan to add\n",
      "want to start\n",
      "plan to buy\n",
      "going to need\n",
      "continue to reduce\n",
      "needed to arrive\n",
      "done to correct\n",
      "cost to make\n",
      "settled to find\n",
      "grew to fulfill\n",
      "attempted to restrict\n",
      "conceived to affirm\n",
      "prefer to believe\n",
      "tried to refashion\n",
      "begin to fear\n",
      "linger to haunt\n",
      "disciplined to serve\n",
      "trained to fulfill\n",
      "organized to furnish\n",
      "continued to paint\n",
      "made to weave\n",
      "try to place\n",
      "hesitate to add\n",
      "seemed to emphasize\n",
      "mean to project\n",
      "wishes to convey\n",
      "beginning to learn\n",
      "start to study\n",
      "said to start\n",
      "wished to get\n",
      "Try to push\n",
      "taken to see\n",
      "promises to open\n",
      "selected to operate\n",
      "used to measure\n",
      "employed to measure\n",
      "used to detect\n",
      "tend to reflect\n",
      "used to scan\n",
      "decided to enter\n",
      "preparing to matriculate\n",
      "continued to help\n",
      "intend to carry\n",
      "lived to see\n",
      "manage to experiment\n",
      "tempted to compare\n",
      "made to see\n",
      "caused to glow\n",
      "made to flow\n",
      "happened to place\n",
      "used to construct\n",
      "used to fill\n",
      "examine to make\n",
      "designed to counter\n",
      "tend to become\n",
      "try to share\n",
      "continue to make\n",
      "come to expect\n",
      "used to keep\n",
      "bound to increase\n",
      "trying to match\n",
      "going to take\n",
      "continue to exceed\n",
      "extended to compare\n",
      "continue to divorce\n",
      "fail to lower\n",
      "supposed to stand\n",
      "prepared to teach\n",
      "school to cover\n",
      "make to assess\n",
      "try to set\n",
      "encouraged to take\n",
      "try to maintain\n",
      "plan to limit\n",
      "make to assure\n",
      "afford to spend\n",
      "Aim to balance\n",
      "Check to see\n",
      "called to determine\n",
      "cooperate to launch\n",
      "designed to expose\n",
      "existing to acquaint\n",
      "like to organize\n",
      "begin to appreciate\n",
      "inclined to think\n",
      "needed to protect\n",
      "struggling to meet\n",
      "helping to account\n",
      "want to learn\n",
      "used to think\n",
      "fights to change\n",
      "tends to rise\n",
      "expects to extend\n",
      "learn to wear\n",
      "tried to make\n",
      "appears to lie\n",
      "attempted to provide\n",
      "found to allow\n",
      "planned to duplicate\n",
      "wants to interest\n",
      "want to risk\n",
      "want to use\n",
      "continue to learn\n",
      "meant to convey\n",
      "used to minimize\n",
      "try to wrestle\n",
      "trying to install\n",
      "plan to build\n",
      "equipped to handle\n",
      "equipped to package\n",
      "equipped to receive\n",
      "equipped to save\n",
      "plan to increase\n",
      "hopes to cut\n",
      "bound to swell\n",
      "begin to feel\n",
      "want to change\n",
      "arrange to rent\n",
      "plan to travel\n",
      "plan to visit\n",
      "like to start\n",
      "wish to budget\n",
      "wanting to rent\n",
      "want to see\n",
      "want to throw\n",
      "designed to work\n",
      "trying to prepare\n",
      "began to develop\n",
      "used to suggest\n",
      "wanted to polish\n",
      "pays to consider\n",
      "compelled to use\n",
      "began to fall\n",
      "begun to write\n",
      "made to seem\n",
      "attempting to direct\n",
      "pleased to call\n",
      "scheduled to nominate\n",
      "come to spend\n",
      "managed to irrigate\n",
      "stooped to scoop\n",
      "fall to show\n",
      "try to push\n",
      "begins to deteriorate\n",
      "used to like\n",
      "offered to ship\n",
      "hopes to find\n",
      "invented to hold\n",
      "learn to like\n",
      "labored to set\n",
      "set to receive\n",
      "entered to compete\n",
      "seem to make\n",
      "seemed to answer\n",
      "decided to use\n",
      "began to show\n",
      "Wishing to show\n",
      "learned to set\n",
      "forced to fly\n",
      "hope to break\n",
      "came to recognize\n",
      "turning to cup\n",
      "seems to creep\n",
      "going to live\n",
      "got to learn\n",
      "learn to live\n",
      "going to live\n",
      "like to sew\n",
      "love to run\n",
      "love to crack\n",
      "yearn to make\n",
      "tried to see\n",
      "love to dust\n",
      "like to become\n",
      "decide to write\n",
      "cause to exist\n",
      "learn to portray\n",
      "learn to portray\n",
      "began to advise\n",
      "taught to yield\n",
      "prefer to cope\n",
      "helps to explain\n",
      "surprised to bump\n",
      "seemed to brave\n",
      "begins to regard\n",
      "began to embezzle\n",
      "appears to endorse\n",
      "expected to like\n",
      "begin to assert\n",
      "began to challenge\n",
      "going to become\n",
      "helping to make\n",
      "began to stress\n",
      "began to describe\n",
      "fails to gain\n",
      "liked to play\n",
      "love to audition\n",
      "wanted to show\n",
      "like to see\n",
      "loved to dance\n",
      "try to bid\n",
      "wanted to go\n",
      "asked to leave\n",
      "continued to promote\n",
      "wished to meet\n",
      "hoping to see\n",
      "got to know\n",
      "paused to comfort\n",
      "hesitate to quote\n",
      "decided to see\n",
      "wanted to take\n",
      "need to know\n",
      "need to look\n",
      "beginning to protrude\n",
      "try to speak\n",
      "decides to proceed\n",
      "interested to hear\n",
      "seems to probe\n",
      "preferring to consider\n",
      "known to go\n",
      "amazed to realize\n",
      "seeking to help\n",
      "interpreted to conform\n",
      "explored to find\n",
      "trying to throw\n",
      "designed to find\n",
      "required to mark\n",
      "asked to consider\n",
      "seem to involve\n",
      "seems to smell\n",
      "seems to see\n",
      "learned to develop\n",
      "arranged to meet\n",
      "need to work\n",
      "want to raise\n",
      "need to bring\n",
      "expect to grow\n",
      "expected to work\n",
      "want to include\n",
      "going to produce\n",
      "want to hire\n",
      "want to buy\n",
      "want to hire\n",
      "going to farm\n",
      "need to know\n",
      "want to undertake\n",
      "want to buy\n",
      "wish to locate\n",
      "plan to sell\n",
      "want to go\n",
      "intend to raise\n",
      "cost to live\n",
      "expected to produce\n",
      "expect to get\n",
      "forced to lay\n",
      "trying to explain\n",
      "happened to light\n",
      "began to turn\n",
      "intended to warn\n",
      "used to transform\n",
      "forced to overcome\n",
      "begins to give\n",
      "failed to post\n",
      "refused to permit\n",
      "encouraged to beget\n",
      "obliged to obey\n",
      "united to push\n",
      "try to oppose\n",
      "made to impose\n",
      "wanted to clarify\n",
      "proposed to sail\n",
      "determined to catch\n",
      "forced to turn\n",
      "seemed to sense\n",
      "seemed to know\n",
      "tried to brush\n",
      "turning to repeat\n",
      "tried to persuade\n",
      "wanted to turn\n",
      "preparing to pacify\n",
      "forced to retreat\n",
      "contracted to supply\n",
      "forced to leave\n",
      "offering to bring\n",
      "attempt to bring\n",
      "decided to cast\n",
      "liked to tease\n",
      "going to buy\n",
      "com to sea\n",
      "drilled to follow\n",
      "born to command\n",
      "come to recognize\n",
      "allowed to account\n",
      "created to fan\n",
      "come to mean\n",
      "trying to make\n",
      "refusing to keep\n",
      "wishes to discuss\n",
      "want to ask\n",
      "want to tap\n",
      "said to use\n",
      "employed to see\n",
      "shoot to kill\n",
      "refused to touch\n",
      "threatened to shoot\n",
      "said to let\n",
      "begin to roll\n",
      "held to assure\n",
      "going to make\n",
      "managed to get\n",
      "wanted to play\n",
      "prepared to counterattack\n",
      "failed to rally\n",
      "tried to rape\n",
      "refused to speak\n",
      "called to look\n",
      "refused to say\n",
      "mean to suggest\n",
      "prepared to carry\n",
      "designed to overthrow\n",
      "trying to put\n",
      "needed to work\n",
      "disposed to exploit\n",
      "fail to see\n",
      "bound to fall\n",
      "tempted to place\n",
      "need to ask\n",
      "seek to undermine\n",
      "hand to show\n",
      "begun to spit\n",
      "threatened to ignite\n",
      "invited to take\n",
      "rushing to keep\n",
      "like to wander\n",
      "like to follow\n",
      "professing to believe\n",
      "want to show\n",
      "enabled to attend\n",
      "determined to exercise\n",
      "inclined to exaggerate\n",
      "like to go\n",
      "determined to marry\n",
      "said to sprinkle\n",
      "used to stop\n",
      "bought to apply\n",
      "supposed to cause\n",
      "said to give\n",
      "allowed to rest\n",
      "enters to spoil\n",
      "wish to deny\n",
      "allowed to warm\n",
      "wishes to entertain\n",
      "allowed to stand\n",
      "refused to accept\n",
      "wished to continue\n",
      "persuaded to accept\n",
      "decided to charge\n",
      "decided to go\n",
      "allowed to see\n",
      "agreed to take\n",
      "decide to send\n",
      "allowed to delay\n",
      "request to leave\n",
      "promised to treat\n",
      "declined to enter\n",
      "added to reinforce\n",
      "obliged to publish\n",
      "continue to serve\n",
      "plans to serve\n",
      "Hoping to cut\n",
      "obliged to announce\n",
      "wish to preserve\n",
      "heard to remark\n",
      "hopes to redress\n",
      "desires to walk\n",
      "prefer to take\n",
      "likes to measure\n",
      "proposed to corral\n",
      "intended to stay\n",
      "ceased to look\n",
      "manages to overlook\n",
      "troubled to read\n",
      "destined to go\n",
      "expected to go\n",
      "used to characterize\n",
      "helping to raise\n",
      "decided to stay\n",
      "used to refer\n",
      "needs to educate\n",
      "tended to tamp\n",
      "like to underline\n",
      "begun to falter\n",
      "intend to include\n",
      "wish to improve\n",
      "try to take\n",
      "prefers to designate\n",
      "want to join\n",
      "seeking to increase\n",
      "used to make\n",
      "used to make\n",
      "inclined to remain\n",
      "heard to say\n",
      "stopped to receive\n",
      "used to describe\n",
      "claimed to own\n",
      "tried to find\n",
      "meant to pay\n",
      "given to go\n",
      "wanted to make\n",
      "began to gallop\n",
      "attempting to lasso\n",
      "failing to encircle\n",
      "got to get\n",
      "trying to maneuver\n",
      "beginning to go\n",
      "began to pull\n",
      "began to draw\n",
      "like to go\n",
      "tend to compete\n",
      "doing to help\n",
      "begins to see\n",
      "Desiring to fill\n",
      "tends to look\n",
      "try to match\n",
      "played to win\n",
      "failed to make\n",
      "began to involve\n",
      "learning to bunt\n",
      "dared to dream\n",
      "dared to taunt\n",
      "refused to come\n",
      "undertook to set\n",
      "essayed to down\n",
      "began to prosper\n",
      "liked to wring\n",
      "happened to sit\n",
      "hastened to place\n",
      "began to offer\n",
      "seemed to indicate\n",
      "liked to imagine\n",
      "expected to know\n",
      "began to appear\n",
      "begin to store\n",
      "continue to sanction\n",
      "intended to demonstrate\n",
      "permitted to exercise\n",
      "encouraged to develop\n",
      "failing to behave\n",
      "appeared to regard\n",
      "seek to disprove\n",
      "tends to fuse\n",
      "prefers to adduce\n",
      "empowered to compel\n",
      "designed to prevent\n",
      "disposed to heed\n",
      "agree to let\n",
      "seeking to reform\n",
      "used to crowd\n",
      "Ask to see\n",
      "interested to learn\n",
      "pass to add\n",
      "demanding to know\n",
      "seems to threaten\n",
      "tried to describe\n",
      "tried to explain\n",
      "seem to feel\n",
      "got to play\n",
      "ceased to need\n",
      "like to live\n",
      "came to see\n",
      "threatens to break\n",
      "begins to fade\n",
      "begins to appear\n",
      "equipped to tell\n",
      "used to increase\n",
      "hired to repeat\n",
      "wished to make\n",
      "seems to exist\n",
      "means to choose\n",
      "struggle to insulate\n",
      "serves to crystallize\n",
      "doomed to become\n",
      "serves to illuminate\n",
      "failed to furnish\n",
      "encouraged to trade\n",
      "continued to come\n",
      "promised to send\n",
      "attempted to understand\n",
      "decided to send\n",
      "assigned to arrest\n",
      "planned to build\n",
      "offered to surrender\n",
      "gone to live\n",
      "returned to succeed\n",
      "expected to arrange\n",
      "expected to supply\n",
      "expected to entertain\n",
      "tried to bring\n",
      "provoked to use\n",
      "refused to let\n",
      "needed to outwit\n",
      "purporting to inform\n",
      "inspired to remind\n",
      "mean to tell\n",
      "trying to demonstrate\n",
      "went to visit\n",
      "continued to teach\n",
      "beginning to devise\n",
      "learn to like\n",
      "stood to watch\n",
      "planned to go\n",
      "trying to plan\n",
      "continues to grow\n",
      "learn to keep\n",
      "learned to polish\n",
      "left to meet\n",
      "fails to make\n",
      "resolved to maintain\n",
      "register to vote\n",
      "needs to make\n",
      "going to march\n",
      "proposed to defeat\n",
      "proposed to enter\n",
      "seems to require\n",
      "seem to violate\n",
      "tended to obscure\n",
      "continue to view\n",
      "try to coerce\n",
      "likes to believe\n",
      "continue to affect\n",
      "served to overcome\n",
      "tends to further\n",
      "help to reveal\n",
      "struggle to assert\n",
      "said to exist\n",
      "taken to guard\n",
      "done to increase\n",
      "ready to tick\n",
      "forced to hypothesize\n",
      "used to challenge\n",
      "permitted to authorize\n",
      "decides to break\n",
      "required to pass\n",
      "decide to clobber\n",
      "decided to reverse\n",
      "tried to start\n",
      "forbidden to fly\n",
      "required to copy\n",
      "began to move\n",
      "run to live\n",
      "started to glance\n",
      "try to memorize\n",
      "turned to look\n",
      "trying to talk\n",
      "started to decline\n",
      "continues to take\n",
      "continues to center\n",
      "come to see\n",
      "come to walk\n",
      "beginning to complain\n",
      "gather to sing\n",
      "began to converse\n",
      "began to relax\n",
      "hoped to become\n",
      "forced to restrict\n",
      "began to give\n",
      "asked to become\n",
      "trying to sell\n",
      "serves to stimulate\n",
      "seemed to lack\n",
      "offered to make\n",
      "assembled to warrant\n",
      "returned to preside\n",
      "sought to prevent\n",
      "expect to stand\n",
      "compelled to face\n",
      "continue to live\n",
      "refused to move\n",
      "refused to obey\n",
      "doomed to become\n",
      "tended to romanticize\n",
      "supposed to keep\n",
      "left to rest\n",
      "wants to see\n",
      "tended to dress\n",
      "designed to become\n",
      "begins to feel\n",
      "tends to depict\n",
      "transferred to become\n",
      "impelled to make\n",
      "seeks to make\n",
      "made to look\n",
      "happen to meet\n",
      "told to lie\n",
      "wanted to write\n",
      "tempted to say\n",
      "omitting to assert\n",
      "continue to live\n",
      "refused to permit\n",
      "served to maintain\n",
      "seem to make\n",
      "help to dispel\n",
      "trained to describe\n",
      "daring to abandon\n",
      "seem to resemble\n",
      "appears to lie\n",
      "tend to persist\n",
      "tried to describe\n",
      "like to call\n",
      "began to speak\n",
      "try to say\n",
      "attempting to make\n",
      "attempt to answer\n",
      "wanted to know\n",
      "designed to enhance\n",
      "intended to provide\n",
      "continue to suffer\n",
      "serves to make\n",
      "fails to reach\n",
      "beginning to crack\n",
      "drawn to join\n",
      "made to bite\n",
      "forbidden to swing\n",
      "seemed to hear\n",
      "hired to drive\n",
      "try to work\n",
      "forbidden to love\n",
      "made to represent\n",
      "starts to ride\n",
      "tries to stop\n",
      "begins to gather\n",
      "brought to pass\n",
      "tends to reflect\n",
      "tended to stratify\n",
      "chosen to use\n",
      "used to mean\n",
      "forced to respond\n",
      "tends to lose\n",
      "tends to express\n",
      "made to integrate\n",
      "try to get\n",
      "attempted to restrain\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "wished to continue\n",
      "failed to flourish\n",
      "propose to go\n",
      "wished to segregate\n",
      "liked to fancy\n",
      "Deciding to become\n",
      "strove to see\n",
      "used to play\n",
      "returned to live\n",
      "proceeded to find\n",
      "likes to catch\n",
      "seems to care\n",
      "intends to save\n",
      "compelled to find\n",
      "wishes to continue\n",
      "ceasing to write\n",
      "stops to ask\n",
      "expected to fulfill\n",
      "tailored to meet\n",
      "want to say\n",
      "want to quote\n",
      "seems to realize\n",
      "primed to catch\n",
      "try to diagnose\n",
      "want to point\n",
      "used to regard\n",
      "seems to represent\n",
      "trying to draw\n",
      "wish to see\n",
      "used to include\n",
      "allowed to operate\n",
      "urged to produce\n",
      "afford to present\n",
      "decides to drop\n",
      "expect to abolish\n",
      "needed to pit\n",
      "tempted to blame\n",
      "hope to serve\n",
      "tried to remedy\n",
      "tends to express\n",
      "seem to believe\n",
      "permitted to return\n",
      "attempted to make\n",
      "prepared to demonstrate\n",
      "calculated to suggest\n",
      "seemed to disconcert\n",
      "known to make\n",
      "going to talk\n",
      "learns to focus\n",
      "chooses to subordinate\n",
      "wish to preserve\n",
      "cease to exist\n",
      "seem to constitute\n",
      "destined to fail\n",
      "wants to get\n",
      "began to understand\n",
      "wanted to capture\n",
      "liked to tell\n",
      "decided to migrate\n",
      "continued to trouble\n",
      "labored to finish\n",
      "decided to return\n",
      "waiting to go\n",
      "chosen to serve\n",
      "came to know\n",
      "helped to escape\n",
      "opened to admit\n",
      "happened to see\n",
      "brought to bear\n",
      "inclined to argue\n",
      "seeming to say\n",
      "prompted to write\n",
      "come to dominate\n",
      "used to illustrate\n",
      "prepared to find\n",
      "wish to argue\n",
      "begin to read\n",
      "plan to discuss\n",
      "come to call\n",
      "expect to find\n",
      "come to believe\n",
      "continue to pay\n",
      "tend to thump\n",
      "determined to prove\n",
      "learn to control\n",
      "used to frustrate\n",
      "trying to assert\n",
      "trying to expose\n",
      "comes to regard\n",
      "felt to indicate\n",
      "came to speak\n",
      "needed to explain\n",
      "required to make\n",
      "sought to make\n",
      "accustomed to think\n",
      "come to look\n",
      "undertook to give\n",
      "came to study\n",
      "bound to go\n",
      "tried to dazzle\n",
      "got to know\n",
      "presumed to address\n",
      "obliged to defend\n",
      "coming to spend\n",
      "learned to write\n",
      "obliged to send\n",
      "began to trail\n",
      "began to fly\n",
      "tried to calm\n",
      "inspired to complete\n",
      "began to talk\n",
      "compelled to spend\n",
      "expected to carry\n",
      "tend to make\n",
      "liked to think\n",
      "trying to emulate\n",
      "wanted to know\n",
      "seemed to remember\n",
      "asked to yield\n",
      "made to look\n",
      "begun to lose\n",
      "failed to learn\n",
      "wanted to take\n",
      "writing to devote\n",
      "vowed to kneel\n",
      "hoping to lift\n",
      "forced to seek\n",
      "continue to urge\n",
      "prepared to assist\n",
      "hope to make\n",
      "continue to maintain\n",
      "scheduled to go\n",
      "taken to program\n",
      "begun to probe\n",
      "attempting to present\n",
      "instructed to burn\n",
      "attempted to conclude\n",
      "equipped to handle\n",
      "trying to check\n",
      "mean to write\n",
      "wished to pursue\n",
      "refused to attend\n",
      "decided to dance\n",
      "failed to amaze\n",
      "continued to search\n",
      "threatening to swallow\n",
      "pleased to see\n",
      "tried to discover\n",
      "disturbed to find\n",
      "failed to realize\n",
      "manage to get\n",
      "wanted to buy\n",
      "decided to bypass\n",
      "allowed to preach\n",
      "allowed to pass\n",
      "dared to drop\n",
      "expected to move\n",
      "means to ridicule\n",
      "hesitate to sacrifice\n",
      "forced to move\n",
      "taken to effect\n",
      "hoped to imprint\n",
      "tailored to fit\n",
      "obliged to describe\n",
      "tried to block\n",
      "chosen to edit\n",
      "plotted to take\n",
      "tried to halt\n",
      "wanted to die\n",
      "returned to make\n",
      "like to believe\n",
      "bother to look\n",
      "used to go\n",
      "seemed to thaw\n",
      "came to give\n",
      "wanted to see\n",
      "used to look\n",
      "meant to help\n",
      "like to straighten\n",
      "hope to give\n",
      "bark to let\n",
      "dash to get\n",
      "tried to talk\n",
      "decided to leave\n",
      "used to tell\n",
      "continue to reflect\n",
      "appear to preach\n",
      "intend to let\n",
      "need to test\n",
      "learned to meet\n",
      "said to give\n",
      "serves to reduce\n",
      "thought to provide\n",
      "tends to give\n",
      "wish to deny\n",
      "expect to find\n",
      "seek to capture\n",
      "allowed to claim\n",
      "seeks to recapture\n",
      "determined to bulldoze\n",
      "sought to run\n",
      "needed to make\n",
      "hurry to catch\n",
      "planned to bolt\n",
      "fit to nominate\n",
      "intend to support\n",
      "refusing to abandon\n",
      "begun to parallel\n",
      "help to give\n",
      "fail to convey\n",
      "tends to lose\n",
      "aimed to write\n",
      "granted to serve\n",
      "tends to underestimate\n",
      "permitted to cross\n",
      "demanding to know\n",
      "obliged to remain\n",
      "delighted to make\n",
      "seem to shake\n",
      "assigned to check\n",
      "volunteered to advance\n",
      "went to hurry\n",
      "refused to notice\n",
      "began to select\n",
      "began to specify\n",
      "failed to work\n",
      "care to come\n",
      "helped to deepen\n",
      "come to say\n",
      "fitted to live\n",
      "stoop to argue\n",
      "obliged to insist\n",
      "managed to annex\n",
      "going to prove\n",
      "preparing to test\n",
      "came to know\n",
      "got to know\n",
      "persuaded to lend\n",
      "expected to report\n",
      "began to experience\n",
      "attempted to get\n",
      "happened to catch\n",
      "chanced to soil\n",
      "begins to besiege\n",
      "beginning to attract\n",
      "come to learn\n",
      "serve to lead\n",
      "try to get\n",
      "longing to see\n",
      "long to see\n",
      "trying to promote\n",
      "beginning to fill\n",
      "wants to linger\n",
      "chiseled to match\n",
      "trying to track\n",
      "determined to get\n",
      "began to develop\n",
      "continued to grow\n",
      "decided to capitalize\n",
      "came to favor\n",
      "used to describe\n",
      "began to play\n",
      "gathered to hear\n",
      "guaranteed to excite\n",
      "invited to deliver\n",
      "sent to knoe\n",
      "preparing to deport\n",
      "told to leave\n",
      "constrained to move\n",
      "refused to let\n",
      "managed to get\n",
      "trying to get\n",
      "tending to arouse\n",
      "sent to get\n",
      "tried to arbitrate\n",
      "tried to arbitrate\n",
      "ordered to knock\n",
      "refused to attend\n",
      "determined to compel\n",
      "refused to sanction\n",
      "going to let\n",
      "attempt to prorate\n",
      "leaving to come\n",
      "please to write\n",
      "want to go\n",
      "want to teach\n",
      "wanted to go\n",
      "tried to picture\n",
      "waiting to hear\n",
      "came to live\n",
      "began to show\n",
      "tends to weaken\n",
      "seems to rise\n",
      "permitted to see\n",
      "continues to discuss\n",
      "serve to sublimate\n",
      "wanted to close\n",
      "wished to keep\n",
      "want to describe\n",
      "began to denounce\n",
      "afford to place\n",
      "try to fit\n",
      "decides to enter\n",
      "expected to prefer\n",
      "tend to bring\n",
      "tend to become\n",
      "tend to assimilate\n",
      "tend to converge\n",
      "disposed to question\n",
      "forced to realize\n",
      "assembled to bear\n",
      "beginning to tell\n",
      "hastened to dispatch\n",
      "ordered to attack\n",
      "going to trouble\n",
      "wanted to borrow\n",
      "trying to pick\n",
      "helping to prevent\n",
      "preferred to sell\n",
      "think to take\n",
      "ordered to approach\n",
      "prepared to move\n",
      "come to pay\n",
      "refused to grant\n",
      "want to offend\n",
      "seeming to invalidate\n",
      "want to drive\n",
      "left to resist\n",
      "tempted to consider\n",
      "empowered to swear\n",
      "allowed to appoint\n",
      "wanted to invest\n",
      "decided to stay\n",
      "live to see\n",
      "began to put\n",
      "decided to leave\n",
      "wanted to leave\n",
      "want to see\n",
      "come to say\n",
      "began to move\n",
      "went to visit\n",
      "got to drink\n",
      "seem to know\n",
      "wanted to help\n",
      "seem to fall\n",
      "tends to obscure\n",
      "beginning to point\n",
      "trying to prove\n",
      "trying to sort\n",
      "Start to prepare\n",
      "obliged to go\n",
      "declined to introduce\n",
      "enter to ask\n",
      "seems to lie\n",
      "continued to shape\n",
      "seem to pass\n",
      "prepared to accept\n",
      "done to obtaine\n",
      "expected to reach\n",
      "seems to refer\n",
      "tried to consult\n",
      "came to put\n",
      "seemed to promise\n",
      "needed to possess\n",
      "seem to indicate\n",
      "purports to examine\n",
      "attempts to understand\n",
      "tend to disprove\n",
      "forced to admit\n",
      "attempt to ascertain\n",
      "forced to demonstrate\n",
      "sought to maintain\n",
      "determined to resist\n",
      "compelled to make\n",
      "threatening to murder\n",
      "agreed to see\n",
      "learned to know\n",
      "written to say\n",
      "came to see\n",
      "liked to think\n",
      "chosen to follow\n",
      "went to see\n",
      "forced to depict\n",
      "expect to find\n",
      "hoped to persuade\n",
      "decided to go\n",
      "compelled to spend\n",
      "indisposed to appear\n",
      "try to keep\n",
      "arrived to see\n",
      "try to keep\n",
      "made to write\n",
      "training to keep\n",
      "decided to give\n",
      "wanted to apologize\n",
      "began to cry\n",
      "going to make\n",
      "forced to learn\n",
      "required to absorb\n",
      "learned to write\n",
      "learned to dispute\n",
      "learned to dispute\n",
      "ceased to exist\n",
      "inclined to inquire\n",
      "like to say\n",
      "permitted to write\n",
      "wait to see\n",
      "choose to fill\n",
      "served to confirm\n",
      "like to suggest\n",
      "wanted to know\n",
      "expected to happen\n",
      "asked to join\n",
      "seem to regard\n",
      "inclined to say\n",
      "cease to haunt\n",
      "wishes to express\n",
      "continue to bridge\n",
      "struggle to keep\n",
      "begin to look\n",
      "began to feel\n",
      "begins to doubt\n",
      "seemed to survive\n",
      "begins to dream\n",
      "refuses to surrender\n",
      "began to discover\n",
      "decided to seek\n",
      "seek to eliminate\n",
      "organized to deal\n",
      "expected to consist\n",
      "beginning to use\n",
      "tried to enter\n",
      "forced to play\n",
      "want to quibble\n",
      "used to make\n",
      "love to suffer\n",
      "love to suffer\n",
      "came to believe\n",
      "trying to outdo\n",
      "used to say\n",
      "castigates to liberate\n",
      "helped to educate\n",
      "expect to find\n",
      "supposed to supplant\n",
      "wanted to write\n",
      "asked to see\n",
      "planned to lay\n",
      "wanted to put\n",
      "decide to disown\n",
      "wanted to pay\n",
      "known to make\n",
      "trying to prove\n",
      "required to meet\n",
      "designed to improve\n",
      "designed to assist\n",
      "wish to buy\n",
      "made to establish\n",
      "required to carry\n",
      "established to provide\n",
      "desire to explore\n",
      "required to own\n",
      "required to attain\n",
      "decide to support\n",
      "prepared to depart\n",
      "designed to provide\n",
      "designed to raise\n",
      "designed to prevent\n",
      "aimed to attract\n",
      "like to press\n",
      "take to show\n",
      "designed to prevent\n",
      "persuaded to take\n",
      "induced to establish\n",
      "persuaded to adopt\n",
      "persuaded to adopt\n",
      "prepared to give\n",
      "prepared to enter\n",
      "dedicated to secure\n",
      "like to think\n",
      "like to think\n",
      "afford to lose\n",
      "continues to add\n",
      "helping to pilot\n",
      "prefer to speak\n",
      "go to discuss\n",
      "made to replace\n",
      "continuing to seek\n",
      "seem to add\n",
      "seem to fix\n",
      "known to tax\n",
      "like to see\n",
      "continued to run\n",
      "voted to continue\n",
      "entitled to benefit\n",
      "needed to establish\n",
      "designed to give\n",
      "remain to preserve\n",
      "gathered to thank\n",
      "continue to protect\n",
      "amended to read\n",
      "construed to alter\n",
      "required to correlate\n",
      "amended to read\n",
      "directed to make\n",
      "directed to establish\n",
      "continued to display\n",
      "required to move\n",
      "planned to furnish\n",
      "agreed to submit\n",
      "initiated to resolve\n",
      "found to exist\n",
      "taken to isolate\n",
      "modified to reduce\n",
      "tending to separate\n",
      "established to gather\n",
      "used to study\n",
      "used to measure\n",
      "used to calculate\n",
      "directed to mail\n",
      "offers to pay\n",
      "promises to pay\n",
      "construed to limit\n",
      "directed to pay\n",
      "directed to cover\n",
      "failed to offer\n",
      "intends to pursue\n",
      "helping to create\n",
      "wish to merge\n",
      "pleased to note\n",
      "continue to serve\n",
      "pleased to note\n",
      "inclined to drag\n",
      "trying to get\n",
      "made to enlist\n",
      "try to run\n",
      "designed to help\n",
      "designed to reflect\n",
      "designed to avoid\n",
      "designed to reflect\n",
      "required to help\n",
      "working to develop\n",
      "installed to increase\n",
      "prepared to stay\n",
      "used to keep\n",
      "came to receive\n",
      "tend to create\n",
      "attempting to bring\n",
      "designed to arrest\n",
      "attempt to monopolize\n",
      "held to appoint\n",
      "prepared to submit\n",
      "allowed to petition\n",
      "ordered to terminate\n",
      "required to pass\n",
      "required to pass\n",
      "permitted to endanger\n",
      "compelled to testify\n",
      "permitted to rebut\n",
      "failed to show\n",
      "permitted to rebut\n",
      "refused to require\n",
      "ordered to report\n",
      "ordered to report\n",
      "fail to see\n",
      "sought to secure\n",
      "failed to show\n",
      "entitled to inspect\n",
      "hopes to find\n",
      "like to make\n",
      "found to enable\n",
      "need to concern\n",
      "fail to bring\n",
      "fail to act\n",
      "want to stimulate\n",
      "want to make\n",
      "tended to ignore\n",
      "expected to take\n",
      "expected to know\n",
      "expected to supervise\n",
      "begins to go\n",
      "moved to think\n",
      "beginning to box\n",
      "surprised to find\n",
      "hope to win\n",
      "began to talk\n",
      "begins to take\n",
      "decided to make\n",
      "asked to give\n",
      "formed to give\n",
      "taken to link\n",
      "put to use\n",
      "use to pay\n",
      "going to work\n",
      "combine to provide\n",
      "wish to serve\n",
      "expected to increase\n",
      "needed to maintain\n",
      "needed to obtain\n",
      "planned to maintain\n",
      "needed to meet\n",
      "proposed to authorize\n",
      "decided to stop\n",
      "scheduled to become\n",
      "seek to assure\n",
      "agrees to furnish\n",
      "prepared to consider\n",
      "prepared to act\n",
      "prepared to act\n",
      "required to cease\n",
      "required to operate\n",
      "designed to operate\n",
      "permitted to operate\n",
      "taken to minimize\n",
      "permitted to operate\n",
      "permitted to operate\n",
      "permitted to operate\n",
      "required to operate\n",
      "required to afford\n",
      "elect to use\n",
      "required to file\n",
      "required to file\n",
      "elect to use\n",
      "required to file\n",
      "obligated to furnish\n",
      "trained to read\n",
      "made to assure\n",
      "tend to create\n",
      "rejoicing to remember\n",
      "permitted to run\n",
      "came to work\n",
      "decided to bring\n",
      "found to permit\n",
      "helping to strengthen\n",
      "began to ship\n",
      "believed to provide\n",
      "designed to provide\n",
      "expect to make\n",
      "developed to facilitate\n",
      "set to hold\n",
      "continuing to carry\n",
      "designed to increase\n",
      "improved to obtain\n",
      "purchased to permit\n",
      "extended to provide\n",
      "sought to meet\n",
      "designed to handle\n",
      "invited to participate\n",
      "planned to provide\n",
      "inclined to advance\n",
      "aims to give\n",
      "wish to pursue\n",
      "expected to increase\n",
      "expected to exceed\n",
      "begun to make\n",
      "continues to expand\n",
      "began to make\n",
      "need to learn\n",
      "learn to delegate\n",
      "working to attain\n",
      "begun to translate\n",
      "besieged to serve\n",
      "help to create\n",
      "assumed to originate\n",
      "used to describe\n",
      "expected to cause\n",
      "taken to study\n",
      "required to ensure\n",
      "used to measure\n",
      "used to start\n",
      "started to strike\n",
      "allowed to pull\n",
      "used to measure\n",
      "generalized to include\n",
      "eliminated to obtain\n",
      "extended to include\n",
      "used to derive\n",
      "adjusted to minimize\n",
      "required to make\n",
      "taken to prevent\n",
      "attempts to present\n",
      "evaporate to leave\n",
      "tend to stick\n",
      "helps to float\n",
      "acts to remove\n",
      "tend to accelerate\n",
      "appear to offer\n",
      "allowed to take\n",
      "allowed to distil\n",
      "undertaken to see\n",
      "allowed to stand\n",
      "thought to contribute\n",
      "made to characterize\n",
      "expect to find\n",
      "known to cause\n",
      "allowed to stand\n",
      "allowed to stand\n",
      "used to test\n",
      "allowed to clot\n",
      "need to make\n",
      "try to key\n",
      "manage to keep\n",
      "seem to prefer\n",
      "continues to add\n",
      "begin to play\n",
      "begin to appear\n",
      "begin to dig\n",
      "cease to lay\n",
      "manages to slip\n",
      "seem to recognize\n",
      "like to burrow\n",
      "like to think\n",
      "estimated to contain\n",
      "love to visit\n",
      "fail to show\n",
      "attempts to weigh\n",
      "given to complete\n",
      "required to reach\n",
      "prove to belong\n",
      "varied to allow\n",
      "noted to draw\n",
      "noted to occur\n",
      "permitted to speculate\n",
      "designed to stop\n",
      "failing to demonstrate\n",
      "failed to demonstrate\n",
      "applied to man\n",
      "begin to ossify\n",
      "seen to begin\n",
      "constructed to serve\n",
      "wishes to study\n",
      "attempted to simplify\n",
      "coupled to form\n",
      "appear to affect\n",
      "appear to act\n",
      "presumed to occur\n",
      "found to contain\n",
      "appears to result\n",
      "used to obtain\n",
      "like to re-emphasise\n",
      "adopted to make\n",
      "failed to change\n",
      "failed to show\n",
      "thought to represent\n",
      "failed to show\n",
      "attempting to improve\n",
      "allowed to react\n",
      "used to filter\n",
      "photographed to show\n",
      "thought to represent\n",
      "seems to follow\n",
      "known to contribute\n",
      "fail to elicit\n",
      "failed to evoke\n",
      "fail to eat\n",
      "trying to study\n",
      "try to study\n",
      "wish to show\n",
      "need to find\n",
      "like to give\n",
      "chosen to give\n",
      "need to know\n",
      "plans to go\n",
      "tossed to decide\n",
      "want to know\n",
      "want to study\n",
      "expect to face\n",
      "choose to derive\n",
      "seeking to become\n",
      "mobilized to achieve\n",
      "required to make\n",
      "work to realize\n",
      "seek to encourage\n",
      "prefer to live\n",
      "afford to wait\n",
      "begin to see\n",
      "committed to move\n",
      "continue to satisfy\n",
      "begun to develop\n",
      "programming to go\n",
      "fail to push\n",
      "attempt to communicate\n",
      "fitted to perform\n",
      "seeks to satisfy\n",
      "tends to integrate\n",
      "tends to support\n",
      "threatened to burst\n",
      "helped to understand\n",
      "combined to prevent\n",
      "needed to bolster\n",
      "helping to further\n",
      "seem to vary\n",
      "seem to act\n",
      "obliged to organize\n",
      "expected to show\n",
      "used to adjust\n",
      "tended to break\n",
      "delegated to cooperate\n",
      "expect to obtain\n",
      "planned to double\n",
      "began to plan\n",
      "attempted to design\n",
      "hastened to add\n",
      "seem to indicate\n",
      "decided to hold\n",
      "appear to drop\n",
      "get to take\n",
      "began to get\n",
      "began to meet\n",
      "increased to include\n",
      "chose to report\n",
      "expected to read\n",
      "expected to confront\n",
      "appeared to reach\n",
      "continued to give\n",
      "invoked to explain\n",
      "wanted to go\n",
      "mean to imply\n",
      "supposed to happen\n",
      "learning to read\n",
      "asked to describe\n",
      "learning to read\n",
      "expected to earn\n",
      "expected to earn\n",
      "surprised to find\n",
      "struggle to induce\n",
      "asked to learn\n",
      "prefer to test\n",
      "told to purchase\n",
      "seemed to antagonize\n",
      "designed to develop\n",
      "refused to change\n",
      "refused to change\n",
      "refused to accept\n",
      "supposed to know\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "working to become\n",
      "led to see\n",
      "asked to vote\n",
      "duplicated to form\n",
      "learn to play\n",
      "want to change\n",
      "learns to become\n",
      "began to emerge\n",
      "used to annoy\n",
      "stooping to dispense\n",
      "come to see\n",
      "preferred to keep\n",
      "used to give\n",
      "came to feel\n",
      "used to accomplish\n",
      "found to match\n",
      "required to store\n",
      "saved to represent\n",
      "saved to represent\n",
      "created to accommodate\n",
      "inspected to determine\n",
      "used to look\n",
      "serve to illustrate\n",
      "intended to decrease\n",
      "required to improve\n",
      "italicized to guide\n",
      "seems to center\n",
      "operate to center\n",
      "serves to focus\n",
      "purport to represent\n",
      "hesitates to suggest\n",
      "mentioned to make\n",
      "trying to develop\n",
      "compelled to omit\n",
      "continue to show\n",
      "planning to use\n",
      "expecting to recover\n",
      "meant to move\n",
      "preferred to continue\n",
      "trying to find\n",
      "planned to exterminate\n",
      "trying to marry\n",
      "pledged to hold\n",
      "determined to create\n",
      "seemed to assure\n",
      "attempted to marry\n",
      "obliged to concede\n",
      "expected to democratize\n",
      "Failing to heed\n",
      "determined to keep\n",
      "tend to procrastinate\n",
      "even to repudiate\n",
      "served to minimize\n",
      "encouraged to state\n",
      "trying to unearth\n",
      "decided to remove\n",
      "decide to encourage\n",
      "prefer to hire\n",
      "go to work\n",
      "intended to provide\n",
      "continues to stress\n",
      "encouraged to adopt\n",
      "motivated to take\n",
      "expected to respond\n",
      "training to meet\n",
      "used to pay\n",
      "taken to indicate\n",
      "afford to trade\n",
      "afford to lose\n",
      "taken to exemplify\n",
      "Try to imagine\n",
      "trying to outfox\n",
      "trying to get\n",
      "invited to try\n",
      "try to imagine\n",
      "begin to affect\n",
      "tend to move\n",
      "required to pay\n",
      "seek to force\n",
      "act to accentuate\n",
      "begin to edge\n",
      "move to restrain\n",
      "continue to press\n",
      "trying to win\n",
      "bound to mean\n",
      "continue to move\n",
      "continue to rise\n",
      "operate to keep\n",
      "expected to put\n",
      "presumed to realize\n",
      "assembled to legislate\n",
      "sought to find\n",
      "tend to view\n",
      "wished to minimize\n",
      "designed to deal\n",
      "ordered to retain\n",
      "refused to permit\n",
      "refuse to exercise\n",
      "prepared to read\n",
      "wants to displace\n",
      "authorized to fashion\n",
      "choose to assert\n",
      "used to impose\n",
      "chooses to enforce\n",
      "heard to object\n",
      "goes to prove\n",
      "intended to obstruct\n",
      "entitled to sue\n",
      "entitled to sue\n",
      "appear to permit\n",
      "applied to eliminate\n",
      "entitled to sue\n",
      "entitled to sue\n",
      "elected to file\n",
      "elect to continue\n",
      "intended to ease\n",
      "permitted to survive\n",
      "furnished to probe\n",
      "want to make\n",
      "designed to minimize\n",
      "designed to elicit\n",
      "continued to arrive\n",
      "coded to permit\n",
      "wishing to sell\n",
      "endeavored to maintain\n",
      "directed to provide\n",
      "seeking to continue\n",
      "refused to assume\n",
      "concerned to leave\n",
      "attempt to settle\n",
      "continue to make\n",
      "seems to increase\n",
      "exists to show\n",
      "learning to control\n",
      "want to explore\n",
      "struggling to meet\n",
      "trying to learn\n",
      "continues to increase\n",
      "like to tease\n",
      "begins to decline\n",
      "begins to substitute\n",
      "learned to cooperate\n",
      "begins to participate\n",
      "helping to make\n",
      "failing to achieve\n",
      "trying to say\n",
      "learn to identify\n",
      "failing to make\n",
      "needs to know\n",
      "fails to meet\n",
      "expected to administer\n",
      "used to store\n",
      "permitted to see\n",
      "expected to study\n",
      "wish to note\n",
      "required to furnish\n",
      "want to provide\n",
      "attempt to represent\n",
      "hopes to encourage\n",
      "designed to help\n",
      "appointed to act\n",
      "expected to vote\n",
      "appointed to study\n",
      "tended to take\n",
      "attempted to act\n",
      "attempt to act\n",
      "attempt to act\n",
      "intend to act\n",
      "fail to take\n",
      "try to serve\n",
      "tended to use\n",
      "found to behave\n",
      "impelled to make\n",
      "attempt to analyze\n",
      "designed to reflect\n",
      "deemed to vary\n",
      "held to constitute\n",
      "seem to support\n",
      "designed to cover\n",
      "found to vary\n",
      "taken to rest\n",
      "needs to know\n",
      "attempts to stand\n",
      "wishing to know\n",
      "made to appear\n",
      "attempts to supply\n",
      "like to record\n",
      "claims to show\n",
      "mean to assert\n",
      "mean to assert\n",
      "prepared to say\n",
      "mean to say\n",
      "sought to express\n",
      "said to learn\n",
      "mean to say\n",
      "meant to say\n",
      "meant to say\n",
      "meant to express\n",
      "forced to go\n",
      "disposed to quarrel\n",
      "seem to present\n",
      "allowed to move\n",
      "tended to reflect\n",
      "beginning to appreciate\n",
      "begun to disturb\n",
      "venture to assign\n",
      "crystallized to find\n",
      "begin to show\n",
      "beginning to expand\n",
      "dared to give\n",
      "continued to employ\n",
      "began to creep\n",
      "seems to appear\n",
      "rode to arrest\n",
      "serve to quiet\n",
      "decided to ride\n",
      "prepared to fight\n",
      "allowed to see\n",
      "refused to give\n",
      "compelled to kill\n",
      "desiring to leave\n",
      "wanted to clean\n",
      "needed to hire\n",
      "continued to spring\n",
      "extended to include\n",
      "intending to use\n",
      "need to commit\n",
      "sought to place\n",
      "want to know\n",
      "want to know\n",
      "serve to contrast\n",
      "obligated to regard\n",
      "tried to make\n",
      "attempting to falsify\n",
      "continued to accuse\n",
      "continued to accuse\n",
      "dare to instigate\n",
      "acting to deliver\n",
      "seeking to free\n",
      "endeavoring to deliver\n",
      "doomed to suffer\n",
      "adopted to accomplish\n",
      "fails to honor\n",
      "began to mix\n",
      "began to paint\n",
      "trying to simulate\n",
      "begun to broaden\n",
      "seems to contain\n",
      "tends to assert\n",
      "seem to thrust\n",
      "seems to thrust\n",
      "shaded to pry\n",
      "tend to assert\n",
      "continued to remain\n",
      "tried to escape\n",
      "taxed to pay\n",
      "come to pass\n",
      "seem to believe\n",
      "continues to rise\n",
      "continue to charge\n",
      "beginning to discover\n",
      "continues to offer\n",
      "wants to see\n",
      "come to dominate\n",
      "put to compete\n",
      "refuse to acknowledge\n",
      "liked to work\n",
      "tend to vote\n",
      "going to cure\n",
      "tended to overlook\n",
      "made to replace\n",
      "decided to strip\n",
      "made to satisfy\n",
      "arranged to fit\n",
      "needed to take\n",
      "tried to restrict\n",
      "led to speculate\n",
      "intended to fill\n",
      "restored to go\n",
      "appear to push\n",
      "began to wash\n",
      "wish to address\n",
      "want to meet\n",
      "appeared to evoke\n",
      "tend to blunt\n",
      "try to build\n",
      "tend to become\n",
      "presume to lecture\n",
      "attempting to acquaint\n",
      "failed to state\n",
      "like to make\n",
      "presume to speak\n",
      "mean to live\n",
      "made to look\n",
      "designed to discover\n",
      "seems to use\n",
      "used to describe\n",
      "postulated to explain\n",
      "used to support\n",
      "seem to corroborate\n",
      "wants to hear\n",
      "comes to represent\n",
      "used to accompany\n",
      "seems to symbolize\n",
      "begins to appear\n",
      "begins to ramble\n",
      "help to set\n",
      "calculated to put\n",
      "decided to write\n",
      "seemed to open\n",
      "combine to create\n",
      "learned to use\n",
      "began to take\n",
      "wanted to tell\n",
      "wanted to substitute\n",
      "want to make\n",
      "come to determine\n",
      "begun to ebb\n",
      "intended to incorporate\n",
      "led to postulate\n",
      "hope to discover\n",
      "tended to emphasize\n",
      "fails to explore\n",
      "seeks to make\n",
      "helping to define\n",
      "trying to avoid\n",
      "trying to get\n",
      "made to symbolize\n",
      "kneels to kiss\n",
      "serve to travesty\n",
      "used to equate\n",
      "altered to show\n",
      "altered to show\n",
      "taken to branch\n",
      "attempt to execute\n",
      "used to name\n",
      "used to name\n",
      "used to generate\n",
      "used to select\n",
      "used to select\n",
      "used to specify\n",
      "used to specify\n",
      "expected to serve\n",
      "used to eliminate\n",
      "designed to handle\n",
      "made to take\n",
      "tended to float\n",
      "began to decrease\n",
      "began to build\n",
      "used to provide\n",
      "tend to ensure\n",
      "seems to strive\n",
      "stated to emphasize\n",
      "channeled to produce\n",
      "expected to replace\n",
      "developed to attack\n",
      "needed to translate\n",
      "needed to make\n",
      "used to deny\n",
      "required to localize\n",
      "found to protect\n",
      "used to demonstrate\n",
      "shown to undergo\n",
      "extended to include\n",
      "shown to undergo\n",
      "allowed to go\n",
      "used to classify\n",
      "found to keep\n",
      "made to group\n",
      "continued to supply\n",
      "serves to inactivate\n",
      "needed to inactivate\n",
      "thought to offer\n",
      "serves to extend\n",
      "served to extend\n",
      "required to accomplish\n",
      "found to compare\n",
      "required to remove\n",
      "required to cut\n",
      "tends to push\n",
      "required to cut\n",
      "seen to correlate\n",
      "beginning to advance\n",
      "managed to grow\n",
      "started to open\n",
      "seem to justify\n",
      "claimed to give\n",
      "used to denote\n",
      "required to cause\n",
      "combined to attain\n",
      "used to slit\n",
      "hope to compete\n",
      "helped to alleviate\n",
      "calculated to expand\n",
      "lowered to permit\n",
      "appears to produce\n",
      "intended to cover\n",
      "established to cover\n",
      "repeated to evaluate\n",
      "varied to obtain\n",
      "varied to conform\n",
      "used to provide\n",
      "allowed to reach\n",
      "required to counteract\n",
      "appear to hold\n",
      "utilized to alleviate\n",
      "investigated to allow\n",
      "enlarged to require\n",
      "employed to reduce\n",
      "wait to see\n",
      "adjusted to supply\n",
      "utilized to direct\n",
      "tried to make\n",
      "jumping to anticipate\n",
      "tried to tempt\n",
      "Try to get\n",
      "bothered to phone\n",
      "allowed to make\n",
      "go to school\n",
      "wants to pay\n",
      "seemed to speak\n",
      "wired to set\n",
      "tried to shake\n",
      "going to follow\n",
      "served to overheat\n",
      "seemed to crouch\n",
      "seemed to advance\n",
      "seemed to resist\n",
      "began to write\n",
      "refuse to mention\n",
      "needed to eat\n",
      "wanting to know\n",
      "stop to grasp\n",
      "dared to defy\n",
      "hoping to store\n",
      "going to get\n",
      "want to get\n",
      "trying to talk\n",
      "determined to go\n",
      "proposed to rebuild\n",
      "going to stay\n",
      "plan to repair\n",
      "Hope to see\n",
      "used to take\n",
      "want to kill\n",
      "intend to go\n",
      "wanted to hurt\n",
      "bother to think\n",
      "delighted to see\n",
      "began to weep\n",
      "began to move\n",
      "tried to push\n",
      "tried to rescue\n",
      "seemed to hold\n",
      "began to think\n",
      "strove to think\n",
      "run to tell\n",
      "fail to hear\n",
      "dared to wait\n",
      "dared to pat\n",
      "trying to push\n",
      "began to whirl\n",
      "started to worry\n",
      "tried to push\n",
      "wanted to get\n",
      "tryin to fuck\n",
      "tried to stifle\n",
      "seeking to kill\n",
      "failed to check\n",
      "tried to shut\n",
      "refuses to believe\n",
      "begun to study\n",
      "amazed to discover\n",
      "appear to reject\n",
      "trying to write\n",
      "want to weep\n",
      "love to know\n",
      "like to know\n",
      "seem to think\n",
      "striving to appear\n",
      "begin to get\n",
      "called to take\n",
      "bother to shave\n",
      "tried to stop\n",
      "going to stop\n",
      "like to hear\n",
      "itch to relieve\n",
      "prefer to eat\n",
      "wanted to wipe\n",
      "survive to talk\n",
      "fit to kill\n",
      "began to whip\n",
      "seems to hover\n",
      "waiting to know\n",
      "want to go\n",
      "decided to remain\n",
      "appeared to provide\n",
      "tried to outface\n",
      "turned to smirk\n",
      "used to tell\n",
      "began to speak\n",
      "tried to force\n",
      "knelt to tell\n",
      "tried to live\n",
      "seemed to grow\n",
      "continued to find\n",
      "going to allow\n",
      "continued to proclaim\n",
      "came to warn\n",
      "refused to believe\n",
      "refused to agree\n",
      "wanted to run\n",
      "going to comply\n",
      "started to run\n",
      "crouch to get\n",
      "seem to help\n",
      "close to emit\n",
      "twitching to dislodge\n",
      "descended to blot\n",
      "strained to hear\n",
      "going to let\n",
      "begun to walk\n",
      "wanted to take\n",
      "wanted to talk\n",
      "want to bring\n",
      "consented to postpone\n",
      "meant to keep\n",
      "want to call\n",
      "expecting to find\n",
      "designed to serve\n",
      "made to flow\n",
      "wanting to draw\n",
      "persuaded to come\n",
      "told to ask\n",
      "wish to make\n",
      "promised to speak\n",
      "moved to distort\n",
      "wanted to emphasize\n",
      "liking to work\n",
      "tries to unteach\n",
      "began to worry\n",
      "tried to insist\n",
      "moving to take\n",
      "tried to contain\n",
      "takes to drink\n",
      "aim to keep\n",
      "tried to find\n",
      "stopped to say\n",
      "trying to contain\n",
      "needed to say\n",
      "forgot to order\n",
      "began to dance\n",
      "planned to use\n",
      "began to shave\n",
      "began to pack\n",
      "seemed to care\n",
      "rose to speak\n",
      "continue to plague\n",
      "live to see\n",
      "poised to pour\n",
      "Remember to call\n",
      "trying to reach\n",
      "tried to reach\n",
      "used to love\n",
      "wants to go\n",
      "wanted to wring\n",
      "got to dancing\n",
      "trying to pick\n",
      "began to laugh\n",
      "trying to find\n",
      "going to get\n",
      "want to fight\n",
      "wanting to sock\n",
      "trying to take\n",
      "want to hear\n",
      "seemed to feel\n",
      "trying to help\n",
      "wait to get\n",
      "expect to escape\n",
      "try to fathom\n",
      "allowed to spend\n",
      "try to make\n",
      "wanted to know\n",
      "tried to get\n",
      "tempted to ask\n",
      "decided to tell\n",
      "surprised to find\n",
      "wished to show\n",
      "like to bring\n",
      "beg to inquire\n",
      "wanted to visit\n",
      "like to enact\n",
      "wished to create\n",
      "wish to deceive\n",
      "want to create\n",
      "going to take\n",
      "going to lose\n",
      "consented to meet\n",
      "rose to go\n",
      "chosen to read\n",
      "started to cross\n",
      "seemed to think\n",
      "started to undo\n",
      "longed to tell\n",
      "chose to read\n",
      "served to increase\n",
      "refused to bring\n",
      "got to stop\n",
      "want to take\n",
      "tried to order\n",
      "seeking to create\n",
      "hope to accomplish\n",
      "attempt to rise\n",
      "tried to rise\n",
      "began to crawl\n",
      "failed to reach\n",
      "began to creep\n",
      "began to crawl\n",
      "promised to take\n",
      "meant to shout\n",
      "longed to increase\n",
      "want to begin\n",
      "seemed to imply\n",
      "stopped to admire\n",
      "stayed to visit\n",
      "want to get\n",
      "tried to remember\n",
      "began to riffle\n",
      "promise to make\n",
      "like to travel\n",
      "tried to repair\n",
      "used to play\n",
      "beginning to thin\n",
      "fail to let\n",
      "lean to reach\n",
      "trying to get\n",
      "want to see\n",
      "beginning to see\n",
      "bother to wipe\n",
      "fit to shake\n",
      "going to wake\n",
      "care to get\n",
      "tried to stop\n",
      "expected to hear\n",
      "got to expect\n",
      "going to put\n",
      "got to thaw\n",
      "want to touch\n",
      "made to fall\n",
      "come to rest\n",
      "trying to attain\n",
      "stopped to gaze\n",
      "begun to turn\n",
      "beginning to cook\n",
      "began to develop\n",
      "begun to buy\n",
      "want to thin\n",
      "planned to graduate\n",
      "going to tell\n",
      "trying to get\n",
      "want to roast\n",
      "preferred to sit\n",
      "liked to sit\n",
      "seemed to come\n",
      "plan to conduct\n",
      "required to detect\n",
      "obliged to prepare\n",
      "began to rise\n",
      "attempting to hide\n",
      "begun to protest\n",
      "come to clean\n",
      "rose to put\n",
      "managed to persuade\n",
      "offered to prevail\n",
      "want to hear\n",
      "fumbling to untie\n",
      "want to leave\n",
      "going to work\n",
      "want to keep\n",
      "like to think\n",
      "began to wrap\n",
      "going to put\n",
      "agreed to correspond\n",
      "lived to see\n",
      "longing to fall\n",
      "ask to see\n",
      "seemed to stride\n",
      "agreed to think\n",
      "wished to spend\n",
      "dared to ask\n",
      "supposed to buy\n",
      "planning to greet\n",
      "began to wonder\n",
      "refused to let\n",
      "wanted to kill\n",
      "wanted to go\n",
      "seem to know\n",
      "going to become\n",
      "going to kill\n",
      "like to tell\n",
      "want to see\n",
      "get to come\n",
      "like to dance\n",
      "like to dance\n",
      "wanted to believe\n",
      "trying to put\n",
      "started to say\n",
      "Forgot to get\n",
      "started to say\n",
      "trying to make\n",
      "want to sit\n",
      "trying to get\n",
      "want to lease\n",
      "wanted to shadow\n",
      "trying to make\n",
      "tried to shadow\n",
      "going to join\n",
      "try to keep\n",
      "like to run\n",
      "wanted to case\n",
      "going to join\n",
      "wanted to hang\n",
      "go to pick\n",
      "began to back\n",
      "paused to feel\n",
      "decided to risk\n",
      "turned to face\n",
      "began to feel\n",
      "started to sweep\n",
      "startled to find\n",
      "meant to convey\n",
      "going to leave\n",
      "returning to seek\n",
      "bother to look\n",
      "try to run\n",
      "going to make\n",
      "began to wave\n",
      "gone to get\n",
      "Want to try\n",
      "going to call\n",
      "want to find\n",
      "want to see\n",
      "designed to put\n",
      "turned to see\n",
      "forced to use\n",
      "trying to drag\n",
      "start to angle\n",
      "tried to flatten\n",
      "managed to hunch\n",
      "brought to make\n",
      "surprised to find\n",
      "started to back\n",
      "want to try\n",
      "trying to catch\n",
      "used to keep\n",
      "forget to turn\n",
      "promised to observe\n",
      "started to plod\n",
      "tried to turn\n",
      "beginning to feel\n",
      "decided to indulge\n",
      "forgotten to turn\n",
      "meant to shut\n",
      "want to leave\n",
      "want to go\n",
      "got to remember\n",
      "got to put\n",
      "threaten to call\n",
      "need to take\n",
      "going to get\n",
      "get to know\n",
      "paused to look\n",
      "seemed to remember\n",
      "Happened to hear\n",
      "got to get\n",
      "begun to tell\n",
      "begun to question\n",
      "began to doubt\n",
      "wished to frighten\n",
      "need to break\n",
      "wished to make\n",
      "tried to give\n",
      "got to eat\n",
      "attempt to frighten\n",
      "trying to find\n",
      "want to talk\n",
      "refusing to bear\n",
      "Try to find\n",
      "want to go\n",
      "like to make\n",
      "going to go\n",
      "Remember to tell\n",
      "wanted to know\n",
      "tried to think\n",
      "tried to make\n",
      "began to nod\n",
      "began to sink\n",
      "tried to think\n",
      "tried to explain\n",
      "going to die\n",
      "going to die\n",
      "managed to cover\n",
      "going to believe\n",
      "expected to stand\n",
      "made to include\n",
      "bothering to whisper\n",
      "waiting to see\n",
      "agreed to fill\n",
      "waiting to report\n",
      "going to like\n",
      "going to louse\n",
      "installed to film\n",
      "going to see\n",
      "expect to get\n",
      "going to stand\n",
      "try to stop\n",
      "going to ask\n",
      "hoping to hear\n",
      "constrained to add\n",
      "wants to pass\n",
      "try to phone\n",
      "like to sing\n",
      "forced to undergo\n",
      "supposed to make\n",
      "wants to ask\n",
      "decided to let\n",
      "got to go\n",
      "tried to ignore\n",
      "going to keep\n",
      "startled to meet\n",
      "came to examine\n",
      "tried to bring\n",
      "reaching to release\n",
      "waiting to report\n",
      "used to paint\n",
      "Begin to look\n",
      "wanted to see\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Failing to find\n",
      "Try to forget\n",
      "seen to leave\n",
      "forced to give\n",
      "inclined to admit\n",
      "began to make\n",
      "professed to know\n",
      "asked to use\n",
      "leaving to keep\n",
      "fit to consult\n",
      "asked to see\n",
      "wanted to make\n",
      "continued to discharge\n",
      "seem to belong\n",
      "began to flicker\n",
      "trying to wreck\n",
      "fit to touch\n",
      "going to take\n",
      "trying to clear\n",
      "want to spend\n",
      "paused to look\n",
      "going to allow\n",
      "like to talk\n",
      "planning to set\n",
      "bent to examine\n",
      "turned to jump\n",
      "started to retch\n",
      "going to get\n",
      "come to recognize\n",
      "expected to report\n",
      "failed to see\n",
      "failed to notify\n",
      "failed to co-operate\n",
      "stopping to hear\n",
      "want to talk\n",
      "going to cost\n",
      "wanted to ask\n",
      "going to get\n",
      "going to swear\n",
      "tried to keep\n",
      "think to look\n",
      "tried to find\n",
      "bear to hold\n",
      "began to pace\n",
      "tried to tell\n",
      "intended to scare\n",
      "began to think\n",
      "hired to take\n",
      "going to send\n",
      "helped to create\n",
      "wanted to give\n",
      "led to believe\n",
      "trying to escape\n",
      "began to thrash\n",
      "get to work\n",
      "come to work\n",
      "want to see\n",
      "wanted to get\n",
      "want to go\n",
      "managed to swallow\n",
      "threatened to fire\n",
      "happen to see\n",
      "going to eat\n",
      "began to weep\n",
      "happens to ask\n",
      "want to rent\n",
      "Try to imagine\n",
      "promised to pay\n",
      "planning to remarry\n",
      "determined to get\n",
      "seemed to swell\n",
      "surprised to meet\n",
      "trying to tell\n",
      "known to run\n",
      "seem to preserve\n",
      "got to understand\n",
      "got to know\n",
      "came to ask\n",
      "asked to see\n",
      "began to abuse\n",
      "hurry to hang\n",
      "seemed to mind\n",
      "started to cross\n",
      "started to curse\n",
      "offering to buy\n",
      "began to feel\n",
      "seem to wink\n",
      "continued to stare\n",
      "beginning to feel\n",
      "like to listen\n",
      "want to study\n",
      "relieved to see\n",
      "seemed to notice\n",
      "decided to stay\n",
      "startled to see\n",
      "began to feel\n",
      "bothered to ask\n",
      "beginning to take\n",
      "began to wish\n",
      "want to encourage\n",
      "began to talk\n",
      "paused to moisten\n",
      "went to join\n",
      "got to go\n",
      "trying to get\n",
      "want to know\n",
      "want to take\n",
      "want to leave\n",
      "got to assume\n",
      "got to keep\n",
      "burning to light\n",
      "decided to leave\n",
      "set to stay\n",
      "going to kill\n",
      "go to bat\n",
      "stopped to cherish\n",
      "struggling to bridge\n",
      "learning to think\n",
      "delighted to encounter\n",
      "wanted to explain\n",
      "taught to grow\n",
      "Taught to grow\n",
      "opened to sell\n",
      "required to assume\n",
      "want to make\n",
      "got to hold\n",
      "want to inquire\n",
      "seemed to spend\n",
      "preoccupied to cook\n",
      "asked to speak\n",
      "pacing to stare\n",
      "wished to make\n",
      "began to build\n",
      "needed to carry\n",
      "meaning to live\n",
      "agreed to help\n",
      "agreed to take\n",
      "contract to let\n",
      "refused to believe\n",
      "meant to invade\n",
      "going to turn\n",
      "got to intercept\n",
      "permitted to go\n",
      "failed to anticipate\n",
      "needed to make\n",
      "use to make\n",
      "help to repel\n",
      "seems to shield\n",
      "pretending to sleep\n",
      "threatening to report\n",
      "seem to concentrate\n",
      "want to give\n",
      "trying to pull\n",
      "adjusted to operate\n",
      "like to see\n",
      "bent to observe\n",
      "forced to accompany\n",
      "fear to tread\n",
      "programed to compute\n",
      "remember to program\n",
      "directed to develop\n",
      "schooled to examine\n",
      "appeared to require\n",
      "encouraged to develop\n",
      "remembered to introduce\n",
      "guided to make\n",
      "tried to run\n",
      "tried to tell\n",
      "tried to ask\n",
      "want to ask\n",
      "going to come\n",
      "going to happen\n",
      "going to happen\n",
      "going to take\n",
      "inclined to think\n",
      "manage to follow\n",
      "wanting to tell\n",
      "tried to write\n",
      "exhausted to stay\n",
      "afford to lose\n",
      "afford to pay\n",
      "used to work\n",
      "going to give\n",
      "began to rock\n",
      "tried to call\n",
      "stoop to catch\n",
      "began to paw\n",
      "began to nod\n",
      "hate to leave\n",
      "want to leave\n",
      "groped to reassemble\n",
      "begun to blow\n",
      "began to dissolve\n",
      "meant to help\n",
      "began to tire\n",
      "riding to kill\n",
      "got to get\n",
      "trying to decide\n",
      "try to cut\n",
      "began to weep\n",
      "going to walk\n",
      "tried to veer\n",
      "managed to bat\n",
      "Try to find\n",
      "began to explode\n",
      "racing to join\n",
      "began to snap\n",
      "began to buckle\n",
      "want to go\n",
      "seem to think\n",
      "goin' to move\n",
      "goin' to go\n",
      "goin' to help\n",
      "employed to live\n",
      "trying to keep\n",
      "try to cut\n",
      "going to wait\n",
      "started to slump\n",
      "started to run\n",
      "goin' to kill\n",
      "fighting to hold\n",
      "started to slump\n",
      "forgot to aim\n",
      "started to raise\n",
      "seem to tell\n",
      "want to see\n",
      "meant to insult\n",
      "meant to say\n",
      "tried to step\n",
      "tried to break\n",
      "seemed to pull\n",
      "seemed to change\n",
      "want to know\n",
      "start to work\n",
      "straining to stay\n",
      "Go to sleep\n",
      "stop to graze\n",
      "bothered to speak\n",
      "attempted to salvage\n",
      "seemed to indicate\n",
      "attempted to form\n",
      "tried to pick\n",
      "appeared to disapprove\n",
      "expected to find\n",
      "decided to see\n",
      "go to look\n",
      "wished to prepare\n",
      "hoping to see\n",
      "cease to feel\n",
      "forced to admit\n",
      "expect to see\n",
      "liked to liberate\n",
      "relieved to see\n",
      "try to thank\n",
      "like to starve\n",
      "hoped to succeed\n",
      "hated to answer\n",
      "got to get\n",
      "swung to see\n",
      "offered to walk\n",
      "wanted to avoid\n",
      "dared to enter\n",
      "failing to understand\n",
      "pause to consider\n",
      "chose to ignore\n",
      "dare to face\n",
      "continued to move\n",
      "started to brush\n",
      "trying to focus\n",
      "tried to fling\n",
      "want to tell\n",
      "attempted to kiss\n",
      "going to listen\n",
      "going to listen\n",
      "want to miss\n",
      "goin' to say\n",
      "going to take\n",
      "supposed to walk\n",
      "waiting to catch\n",
      "like to bother\n",
      "attempted to push\n",
      "going to kill\n",
      "going to kill\n",
      "trying to keep\n",
      "seeming to like\n",
      "got to take\n",
      "going to need\n",
      "want to put\n",
      "hoped to catch\n",
      "went to look\n",
      "wanting to unlock\n",
      "amazed to see\n",
      "refused to give\n",
      "tried to lift\n",
      "forced to agree\n",
      "fails to substantiate\n",
      "wants to see\n",
      "beginning to get\n",
      "continued to smile\n",
      "turned to add\n",
      "wanted to get\n",
      "continued to snort\n",
      "started to reach\n",
      "beginning to recover\n",
      "going to talk\n",
      "like to kill\n",
      "going to hear\n",
      "wanted to hear\n",
      "came to investigate\n",
      "managed to duck\n",
      "began to focus\n",
      "trying to yank\n",
      "began to snort\n",
      "wanted to show\n",
      "tried to start\n",
      "going to let\n",
      "going to fight\n",
      "attempting to speak\n",
      "longing to catch\n",
      "rejoicing to think\n",
      "like to get\n",
      "tried to go\n",
      "seemed to make\n",
      "aim to give\n",
      "want to trade\n",
      "beginning to turn\n",
      "forced to maintain\n",
      "hope to locate\n",
      "paused to gather\n",
      "bothering to note\n",
      "turned to survey\n",
      "started to struggle\n",
      "started to return\n",
      "pretended to give\n",
      "served to increase\n",
      "determined to drive\n",
      "try to go\n",
      "began to run\n",
      "continued to come\n",
      "continued to camouflage\n",
      "Forced to realize\n",
      "trying to grab\n",
      "trying to read\n",
      "began to drink\n",
      "started to slide\n",
      "mean to pry\n",
      "going to sell\n",
      "pleased to hear\n",
      "starting to itch\n",
      "like to think\n",
      "supposed to meet\n",
      "wait to get\n",
      "seem to dwell\n",
      "feared to dwell\n",
      "tried to date\n",
      "trying to cut\n",
      "beginning to collect\n",
      "determined to find\n",
      "put to use\n",
      "determined to spend\n",
      "hoping to escape\n",
      "pleased to note\n",
      "calculated to glamorize\n",
      "began to explain\n",
      "want to see\n",
      "wanted to turn\n",
      "began to whip\n",
      "failed to find\n",
      "meant to save\n",
      "wanted to waste\n",
      "want to get\n",
      "going to explode\n",
      "seemed to disintegrate\n",
      "intended to propitiate\n",
      "embarrassing to see\n",
      "going to keel\n",
      "seemed to enjoy\n",
      "like to know\n",
      "deserve to lie\n",
      "want to see\n",
      "pretending to joke\n",
      "used to try\n",
      "trying to look\n",
      "began to watch\n",
      "want to go\n",
      "seemed to sink\n",
      "began to ooze\n",
      "began to move\n",
      "seemed to know\n",
      "trying to talk\n",
      "continued to lash\n",
      "turned to look\n",
      "struggled to control\n",
      "deserved to live\n",
      "like to hunt\n",
      "left to say\n",
      "like to recognize\n",
      "wanting to fly\n",
      "dispatched to harry\n",
      "started to buckle\n",
      "began to crawl\n",
      "wanted to lose\n",
      "going to show\n",
      "going to give\n",
      "trying to size\n",
      "seemed to promise\n",
      "hate to run\n",
      "turned to face\n",
      "wish to enter\n",
      "intend to speak\n",
      "determined to make\n",
      "want to upset\n",
      "resolved to make\n",
      "left to distract\n",
      "vied to knock\n",
      "equipped to die\n",
      "tried to roll\n",
      "commenced to weep\n",
      "began to uncap\n",
      "going to get\n",
      "expected to risk\n",
      "decided to set\n",
      "seem to locate\n",
      "allowed to come\n",
      "allowed to leave\n",
      "sent to clean\n",
      "proceeded to disturb\n",
      "came to teach\n",
      "wait to get\n",
      "get to school\n",
      "beginning to stir\n",
      "got to get\n",
      "seemed to think\n",
      "trying to get\n",
      "struggling to get\n",
      "mean to pull\n",
      "got to take\n",
      "trying to think\n",
      "seeming to scream\n",
      "sought to make\n",
      "proceeded to give\n",
      "advised to flee\n",
      "like to hurt\n",
      "hurt to beat\n",
      "want to go\n",
      "chanced to glance\n",
      "vowed to take\n",
      "started to move\n",
      "began to sizzle\n",
      "cared to see\n",
      "time to pay\n",
      "determined to hold\n",
      "beginning to fold\n",
      "wanted to smoke\n",
      "seem to get\n",
      "trying to find\n",
      "like to keep\n",
      "seem to snap\n",
      "like to think\n",
      "beginning to find\n",
      "beginning to look\n",
      "going to last\n",
      "going to prove\n",
      "hoped to die\n",
      "gone to live\n",
      "stayed to get\n",
      "turned to go\n",
      "going to see\n",
      "going to laugh\n",
      "tried to bite\n",
      "seem to rise\n",
      "come to see\n",
      "got to know\n",
      "seem to take\n",
      "beginning to creep\n",
      "seemed to rain\n",
      "like to hear\n",
      "come to make\n",
      "started to move\n",
      "bent to pick\n",
      "permitted to operate\n",
      "beginning to get\n",
      "seemed to think\n",
      "tried to make\n",
      "wanted to present\n",
      "expected to stay\n",
      "wish to start\n",
      "got to run\n",
      "like to talk\n",
      "disappointed to find\n",
      "tried to reason\n",
      "trying to close\n",
      "want to help\n",
      "surprised to see\n",
      "trying to find\n",
      "neglected to play\n",
      "wanted to call\n",
      "like to offer\n",
      "want to say\n",
      "wished to see\n",
      "overheard to say\n",
      "like to get\n",
      "expected to perform\n",
      "going to bring\n",
      "seek to storm\n",
      "used to defend\n",
      "shocked to find\n",
      "hesitate to speak\n",
      "beginning to study\n",
      "grow to devote\n",
      "wish to turn\n",
      "going to fail\n",
      "wished to change\n",
      "wanted to take\n",
      "wanted to bring\n",
      "like to know\n",
      "intend to marry\n",
      "began to talk\n",
      "used to play\n",
      "trying to get\n",
      "happen to drive\n",
      "hating to get\n",
      "try to walk\n",
      "left to believe\n",
      "tried to rest\n",
      "dying to defend\n",
      "used to kid\n",
      "wanted to paint\n",
      "going to organize\n",
      "try to paint\n",
      "used to hang\n",
      "prepared to worship\n",
      "want to stir\n",
      "beginning to gather\n",
      "tried to believe\n",
      "used to say\n",
      "began to shudder\n",
      "come to understand\n",
      "come to see\n",
      "called to say\n",
      "decided to cremate\n",
      "want to meet\n",
      "impelled to kneel\n",
      "trying to touch\n",
      "trying to flatter\n",
      "trying to worry\n",
      "trying to worry\n",
      "want to go\n",
      "like to take\n",
      "wanted to know\n",
      "trying to get\n",
      "gone to purify\n",
      "waiting to see\n",
      "come to skirt\n",
      "trying to make\n",
      "go to sleep\n",
      "tried to emulate\n",
      "began to pulse\n",
      "amazed to find\n",
      "kneeling to tie\n",
      "trying to get\n",
      "trying to smile\n",
      "seemed to float\n",
      "tried to see\n",
      "stop to analyze\n",
      "supposed to joke\n",
      "supposed to handle\n",
      "want to ask\n",
      "got to admit\n",
      "tried to leave\n",
      "began to walk\n",
      "supposed to stay\n",
      "going to tell\n",
      "going to get\n",
      "intended to make\n",
      "began to zip\n",
      "obliged to roll\n",
      "want to stop\n",
      "going to marry\n",
      "liked to hear\n",
      "tempted to tell\n",
      "seemed to mark\n",
      "tried to explain\n",
      "managed to look\n",
      "needed to get\n",
      "answered to find\n",
      "afford to get\n",
      "started to look\n",
      "takes to get\n",
      "going to get\n",
      "tried to quiet\n",
      "trying to sound\n",
      "came to meet\n",
      "seemed to focus\n",
      "want to talk\n",
      "want to see\n",
      "wants to get\n",
      "went to turn\n",
      "surprised to find\n",
      "want to stay\n",
      "going to make\n",
      "hoped to dig\n",
      "trying to make\n",
      "going to lug\n",
      "surprised to see\n",
      "stop to read\n",
      "intended to move\n",
      "rising to sting\n",
      "arranged to live\n",
      "managed to find\n",
      "inclined to wobble\n",
      "supposed to care\n",
      "shuddered to think\n",
      "seemed to understand\n",
      "aroused to go\n",
      "hate to call\n",
      "wish to leave\n",
      "seemed to follow\n",
      "supposed to matter\n",
      "bothered to tell\n",
      "hesitate to use\n",
      "used to say\n",
      "try to persuade\n",
      "wanted to keep\n",
      "trying to keep\n",
      "blushed to admit\n",
      "want to continue\n",
      "chosen to represent\n",
      "want to leave\n",
      "wanted to work\n",
      "seemed to regard\n",
      "forbore to mention\n",
      "managed to open\n",
      "want to encourage\n",
      "want to watch\n",
      "remember to warn\n",
      "used to take\n",
      "want to use\n",
      "started to throw\n",
      "began to swing\n",
      "started to carry\n",
      "began to look\n",
      "going to happen\n",
      "began to walk\n",
      "trying to say\n",
      "trying to say\n",
      "started to say\n",
      "wants to take\n",
      "started to take\n",
      "began to fascinate\n",
      "left to spend\n",
      "seemed to work\n",
      "work to grow\n",
      "trying to talk\n",
      "lied to shorten\n",
      "trying to make\n",
      "wanted to force\n",
      "refused to take\n",
      "seemed to please\n",
      "grew to depend\n",
      "meant to tell\n",
      "trying to pull\n",
      "seemed to shiver\n",
      "trying to remember\n",
      "worked to recall\n",
      "wished to call\n",
      "seemed to stare\n",
      "began to tremble\n",
      "refusing to think\n",
      "refusing to think\n",
      "hoping to frighten\n",
      "wanted to run\n",
      "began to ache\n",
      "began to bother\n",
      "tried to take\n",
      "wanted to kill\n",
      "stopped to see\n",
      "going to tell\n",
      "going to push\n",
      "wanted to slap\n",
      "started to type\n",
      "helped to build\n",
      "refused to drive\n",
      "wanted to go\n",
      "likes to play\n",
      "like to rise\n",
      "tried to push\n",
      "trying to run\n",
      "tried to make\n",
      "used to say\n",
      "come to exist\n",
      "fit to put\n",
      "stoop to lift\n",
      "wanted to draw\n",
      "going to pick\n",
      "intended to wait\n",
      "determined to foil\n",
      "strode to answer\n",
      "trusted to carry\n",
      "seemed to help\n",
      "chose to come\n",
      "tried to ignore\n",
      "liked to break\n",
      "began to aid\n",
      "going to tear\n",
      "like to exhibit\n",
      "forced to make\n",
      "hate to admit\n",
      "got to decide\n",
      "tried to sell\n",
      "try to swing\n",
      "expect to call\n",
      "paused to get\n",
      "proceeded to search\n",
      "began to suspect\n",
      "endeavoring to cut\n",
      "wanted to know\n",
      "daring to commit\n",
      "given to dig\n",
      "urged to attend\n",
      "refused to receive\n",
      "beckoned to cross\n",
      "taken to keep\n",
      "trying to hold\n",
      "managing to get\n",
      "promised to illustrate\n",
      "pretending to black\n",
      "wanted to remind\n",
      "Resolving to get\n",
      "started to start\n",
      "starting to woolgather\n",
      "bound to get\n",
      "wanted to keep\n",
      "looked to see\n",
      "chosen to complement\n",
      "live to hear\n",
      "leaping to light\n",
      "trying to prove\n",
      "trying to determine\n",
      "supposed to put\n",
      "proceeded to neglect\n",
      "care to count\n",
      "shuddered to think\n",
      "telephoned to announce\n",
      "neglected to consider\n",
      "trouble to memorize\n",
      "deigned to appear\n",
      "seemed to understand\n",
      "try to revive\n",
      "seemed to produce\n",
      "returning to jump\n",
      "tried to farm\n",
      "going to set\n",
      "turned to stare\n",
      "seem to think\n",
      "liked to hire\n",
      "remember to telephone\n",
      "like to work\n",
      "like to disclose\n",
      "got to put\n",
      "got to run\n",
      "waiting to get\n",
      "need to worry\n",
      "seems to think\n",
      "tries to baffle\n",
      "mean to reconsider\n",
      "refused to make\n",
      "seems to make\n",
      "seems to refer\n",
      "seems to say\n",
      "delighted to meet\n",
      "like to know\n",
      "regret to say\n",
      "seems to refer\n",
      "come to talk\n",
      "seem to remember\n",
      "want to hear\n",
      "trying to get\n",
      "forgot to say\n",
      "seemed to believe\n",
      "wanted to get\n",
      "wanted to see\n",
      "wanted to touch\n",
      "got to entertain\n",
      "tried to keep\n",
      "going to tell\n",
      "thought to mix\n",
      "going to jump\n",
      "beginning to catch\n",
      "try to see\n",
      "phoned to say\n",
      "bothering to look\n",
      "forced to wipe\n",
      "used to pretend\n",
      "refused to approach\n",
      "used to express\n",
      "proceeds to lash\n",
      "used to hang\n",
      "seeks to expunge\n",
      "trying to redeem\n",
      "seemed to take\n",
      "tried to conceal\n",
      "came to know\n",
      "refuses to continue\n",
      "continue to scrape\n",
      "given to understand\n",
      "propose to vent\n",
      "proceeded to mask\n",
      "withhold to keep\n",
      "begin to wither\n",
      "help to intensify\n",
      "seems to overtake\n",
      "want to buy\n"
     ]
    }
   ],
   "source": [
    "# Apply process() to every tagged sentence returned by brown.tagged_sents().\n",
    "# NOTE(review): process is defined outside this cell; the saved output suggests it\n",
    "# prints three-word sequences whose middle word is 'to' - confirm against its definition.\n",
    "for tagged_sent in brown.tagged_sents():\n",
    "    process(tagged_sent)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 114,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "best ADJ ADV VERB NOUN\n",
      "close ADV ADJ VERB NOUN\n",
      "open ADJ VERB NOUN ADV\n",
      "present ADJ ADV NOUN VERB\n",
      "that ADP DET PRON ADV\n"
     ]
    }
   ],
   "source": [
    "# Tagged words of the Brown news category, using the universal tagset.\n",
    "brown_news_tagged = brown.tagged_words(categories='news', tagset='universal')\n",
    "# Condition on the lower-cased word form and count the tags observed for it.\n",
    "data = nltk.ConditionalFreqDist(\n",
    "    (word.lower(), tag) for (word, tag) in brown_news_tagged\n",
    ")\n",
    "\n",
    "# Report every word form seen with more than three distinct tags,\n",
    "# listing its tags from most to least frequent.\n",
    "for word in sorted(data.conditions()):\n",
    "    if len(data[word]) <= 3:\n",
    "        continue\n",
    "    tags = [tag for (tag, _count) in data[word].most_common()]\n",
    "    print(word, ' '.join(tags))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 5.3 使用Python字典映射词及其属性"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 2 Python 字典"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 115,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Build a word-to-tag mapping one key at a time, starting from an empty dict.\n",
    "pos = {}\n",
    "pos['colorless'] = 'ADJ'\n",
    "pos['ideas'] = 'N'\n",
    "pos['sleep'] = 'V'\n",
    "pos['furiously'] = 'ADV'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 116,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'colorless': 'ADJ', 'furiously': 'ADV', 'ideas': 'N', 'sleep': 'V'}"
      ]
     },
     "execution_count": 116,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Display the whole mapping.\n",
    "pos"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 117,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['colorless', 'ideas', 'sleep', 'furiously']"
      ]
     },
     "execution_count": 117,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Converting a dict to a list yields its keys.\n",
    "list(pos)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 118,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['colorless', 'furiously', 'ideas', 'sleep']"
      ]
     },
     "execution_count": 118,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# sorted() on a dict returns its keys in sorted order.\n",
    "sorted(pos)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 119,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['colorless', 'ideas']"
      ]
     },
     "execution_count": 119,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Iterating over a dict visits its keys; keep the ones that end in 's'.\n",
    "[w for w in pos if w.endswith('s')]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 120,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "colorless: ADJ\n",
      "furiously: ADV\n",
      "ideas: N\n",
      "sleep: V\n"
     ]
    }
   ],
   "source": [
    "# Print each word with its tag, visiting the keys in sorted order.\n",
    "for word in sorted(pos):\n",
    "    print(word + \":\", pos[word])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 122,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['colorless', 'ideas', 'sleep', 'furiously']"
      ]
     },
     "execution_count": 122,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# keys() exposes the keys explicitly.\n",
    "list(pos.keys())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 123,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['ADJ', 'N', 'V', 'ADV']"
      ]
     },
     "execution_count": 123,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# values() exposes the stored tags.\n",
    "list(pos.values())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 124,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('colorless', 'ADJ'), ('ideas', 'N'), ('sleep', 'V'), ('furiously', 'ADV')]"
      ]
     },
     "execution_count": 124,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# items() exposes (key, value) pairs.\n",
    "list(pos.items())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 125,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "colorless: ADJ\n",
      "furiously: ADV\n",
      "ideas: N\n",
      "sleep: V\n"
     ]
    }
   ],
   "source": [
    "# Unpack the (key, value) pairs directly while iterating, sorted by key.\n",
    "for key, val in sorted(pos.items()):\n",
    "    print(key + \":\", val)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 3 定义字典"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 126,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Define the mapping in a single call: each keyword argument becomes a string key.\n",
    "pos = dict(colorless='ADJ', ideas='N', sleep='V', furiously='ADV')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 4 默认字典"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 127,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "from collections import defaultdict"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 128,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# defaultdict with int as the factory: a missing key reads as int(), i.e. 0.\n",
    "frequency = defaultdict(int)\n",
    "frequency['colorless'] = 4"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 130,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0"
      ]
     },
     "execution_count": 130,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 'ideas' was never assigned, so the factory supplies the value (the lookup also stores it).\n",
    "frequency['ideas']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 131,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Map each word to a list of tags; a word with no entry defaults to an empty list.\n",
    "# Use the defaultdict imported from collections, consistent with the other cells,\n",
    "# instead of reaching it through the nltk package namespace.\n",
    "pos = defaultdict(list)\n",
    "pos['sleep'] = ['NOUN', 'VERB']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 132,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[]"
      ]
     },
     "execution_count": 132,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Looking up a key that has no entry yet.\n",
    "pos['ideas']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 133,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# The factory can be any zero-argument callable; here a missing word defaults to 'NOUN'.\n",
    "pos = defaultdict(lambda: 'NOUN')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 134,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Explicit assignment stores a value under the key as in a plain dict.\n",
    "pos['colorless'] = 'ADJ'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 135,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'NOUN'"
      ]
     },
     "execution_count": 135,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Looking up a key that was never assigned.\n",
    "pos['blog']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 136,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('colorless', 'ADJ'), ('blog', 'NOUN')]"
      ]
     },
     "execution_count": 136,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# List the (key, value) pairs currently stored in pos.\n",
    "list(pos.items())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 137,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Word tokens of 'carroll-alice.txt' from NLTK's Gutenberg corpus.\n",
    "alice = nltk.corpus.gutenberg.words('carroll-alice.txt')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 140,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Frequency distribution over the tokens.\n",
    "vocab = nltk.FreqDist(alice)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 146,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Keep the (up to) 1000 most frequent tokens, dropping their counts.\n",
    "v1000 = [word for (word, _) in vocab.most_common(1000)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 147,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Lookup table in which any key without an entry maps to the placeholder 'UNK'.\n",
    "mapping = defaultdict(lambda: 'UNK')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 148,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Every word in v1000 maps to itself.\n",
    "for v in v1000:\n",
    "    mapping[v] = v"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 149,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Translate every token through mapping.\n",
    "# Note: with a defaultdict, each lookup of a missing token also stores that token in mapping.\n",
    "alice2 = [mapping[v] for v in alice]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 151,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['[', 'Alice', \"'\", 's', 'Adventures', 'in', 'Wonderland', 'by', 'UNK', 'UNK']"
      ]
     },
     "execution_count": 151,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Peek at the first ten translated tokens.\n",
    "alice2[:10]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 5 递增地更新字典"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 152,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Tally table: a key with no entry starts at int(), i.e. 0.\n",
    "counts = defaultdict(int)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 153,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Tally how often each universal tag occurs in the Brown news category.\n",
    "# The tally is (re)created here so that re-running this cell cannot add the\n",
    "# same corpus to the existing totals a second time.\n",
    "counts = defaultdict(int)\n",
    "for (word, tag) in nltk.corpus.brown.tagged_words(categories='news', tagset='universal'):\n",
    "    counts[tag] += 1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 154,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "30654"
      ]
     },
     "execution_count": 154,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Total tallied under the 'NOUN' tag.\n",
    "counts['NOUN']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 155,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['.',\n",
       " 'ADJ',\n",
       " 'ADP',\n",
       " 'ADV',\n",
       " 'CONJ',\n",
       " 'DET',\n",
       " 'NOUN',\n",
       " 'NUM',\n",
       " 'PRON',\n",
       " 'PRT',\n",
       " 'VERB',\n",
       " 'X']"
      ]
     },
     "execution_count": 155,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# The keys of counts (the tags), in sorted order.\n",
    "sorted(counts)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 156,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "from operator import itemgetter"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 157,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('NOUN', 30654),\n",
       " ('VERB', 14399),\n",
       " ('ADP', 12355),\n",
       " ('.', 11928),\n",
       " ('DET', 11389),\n",
       " ('ADJ', 6706),\n",
       " ('ADV', 3349),\n",
       " ('CONJ', 2717),\n",
       " ('PRON', 2535),\n",
       " ('PRT', 2264),\n",
       " ('NUM', 2166),\n",
       " ('X', 92)]"
      ]
     },
     "execution_count": 157,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# (tag, count) pairs ordered by count, largest first; itemgetter(1) picks the count as sort key.\n",
    "sorted(counts.items(), key=itemgetter(1), reverse=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 158,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Index whose values are lists; a key with no entry starts as an empty list.\n",
    "last_letters = defaultdict(list)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 159,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Index the English word list by the last two characters of each word.\n",
    "# Start from an empty index so that re-running this cell cannot append every\n",
    "# word to its bucket a second time.\n",
    "last_letters = defaultdict(list)\n",
    "words = nltk.corpus.words.words('en')\n",
    "for word in words:\n",
    "    key = word[-2:]  # a one-character word is its own key\n",
    "    last_letters[key].append(word)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 161,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['abactinally',\n",
       " 'abandonedly',\n",
       " 'abasedly',\n",
       " 'abashedly',\n",
       " 'abashlessly',\n",
       " 'abbreviately',\n",
       " 'abdominally',\n",
       " 'abhorrently',\n",
       " 'abidingly',\n",
       " 'abiogenetically',\n",
       " 'abiologically',\n",
       " 'abjectly',\n",
       " 'ableptically',\n",
       " 'ably',\n",
       " 'abnormally',\n",
       " 'abominably',\n",
       " 'aborally',\n",
       " 'aboriginally',\n",
       " 'abortively',\n",
       " 'aboundingly',\n",
       " 'abridgedly',\n",
       " 'abruptedly',\n",
       " 'abruptly',\n",
       " 'abscondedly',\n",
       " 'absently',\n",
       " 'absentmindedly',\n",
       " 'absolutely',\n",
       " 'absolutistically',\n",
       " 'absorbedly',\n",
       " 'absorbingly',\n",
       " 'absorptively',\n",
       " 'abstemiously',\n",
       " 'abstinently',\n",
       " 'abstractedly',\n",
       " 'abstractively',\n",
       " 'abstractly',\n",
       " 'abstrusely',\n",
       " 'absurdly',\n",
       " 'abundantly',\n",
       " 'abusedly',\n",
       " 'abusefully',\n",
       " 'abusively',\n",
       " 'abysmally',\n",
       " 'academically',\n",
       " 'acceleratedly',\n",
       " 'accentually',\n",
       " 'acceptably',\n",
       " 'acceptedly',\n",
       " 'accessarily',\n",
       " 'accessibly',\n",
       " 'accessively',\n",
       " 'accessorily',\n",
       " 'accidentally',\n",
       " 'accidently',\n",
       " 'accommodately',\n",
       " 'accommodatingly',\n",
       " 'accordantly',\n",
       " 'accordingly',\n",
       " 'accountably',\n",
       " 'accumulatively',\n",
       " 'accurately',\n",
       " 'accursedly',\n",
       " 'accusably',\n",
       " 'accusatively',\n",
       " 'accusatorially',\n",
       " 'accusingly',\n",
       " 'accustomedly',\n",
       " 'acervately',\n",
       " 'acetometrically',\n",
       " 'achingly',\n",
       " 'achromatically',\n",
       " 'acicularly',\n",
       " 'acidimetrically',\n",
       " 'acidly',\n",
       " 'acknowledgedly',\n",
       " 'acoustically',\n",
       " 'acquiescently',\n",
       " 'acquiescingly',\n",
       " 'acquisitively',\n",
       " 'acridly',\n",
       " 'acrimoniously',\n",
       " 'acrobatically',\n",
       " 'acrocephaly',\n",
       " 'acrogenously',\n",
       " 'acrologically',\n",
       " 'acromegaly',\n",
       " 'acronically',\n",
       " 'acropetally',\n",
       " 'acrostically',\n",
       " 'actinally',\n",
       " 'actinically',\n",
       " 'actinoelectrically',\n",
       " 'actionably',\n",
       " 'actively',\n",
       " 'actually',\n",
       " 'actuarially',\n",
       " 'acutely',\n",
       " 'Adamically',\n",
       " 'adaptationally',\n",
       " 'adaptively',\n",
       " 'addedly',\n",
       " 'additionally',\n",
       " 'additively',\n",
       " 'addleheadedly',\n",
       " 'adequately',\n",
       " 'adherently',\n",
       " 'adhesively',\n",
       " 'adiabatically',\n",
       " 'adjacently',\n",
       " 'adjectivally',\n",
       " 'adjectively',\n",
       " 'adjoinedly',\n",
       " 'adjunctively',\n",
       " 'adjunctly',\n",
       " 'adjustably',\n",
       " 'administratively',\n",
       " 'admirably',\n",
       " 'admiredly',\n",
       " 'admiringly',\n",
       " 'admissibly',\n",
       " 'admittedly',\n",
       " 'admonishingly',\n",
       " 'admonitively',\n",
       " 'admonitorily',\n",
       " 'adnominally',\n",
       " 'adolescently',\n",
       " 'adoptedly',\n",
       " 'adoptively',\n",
       " 'adorably',\n",
       " 'adorally',\n",
       " 'adoringly',\n",
       " 'adorningly',\n",
       " 'adradially',\n",
       " 'adroitly',\n",
       " 'adscititiously',\n",
       " 'adulterately',\n",
       " 'adulterously',\n",
       " 'adumbratively',\n",
       " 'advancingly',\n",
       " 'advantageously',\n",
       " 'adventitiously',\n",
       " 'adventuresomely',\n",
       " 'adventurously',\n",
       " 'adverbially',\n",
       " 'adversatively',\n",
       " 'adversely',\n",
       " 'advertently',\n",
       " 'advisably',\n",
       " 'advisedly',\n",
       " 'advisorily',\n",
       " 'aerially',\n",
       " 'aerobically',\n",
       " 'aerobiologically',\n",
       " 'aerobiotically',\n",
       " 'aerogenically',\n",
       " 'aeronautically',\n",
       " 'aerophilately',\n",
       " 'aeroscopically',\n",
       " 'aesthetically',\n",
       " 'aetiotropically',\n",
       " 'affably',\n",
       " 'affectedly',\n",
       " 'affectingly',\n",
       " 'affectionally',\n",
       " 'affectionately',\n",
       " 'affectively',\n",
       " 'affinely',\n",
       " 'affinitatively',\n",
       " 'affirmably',\n",
       " 'affirmatively',\n",
       " 'affirmingly',\n",
       " 'afflictingly',\n",
       " 'afflictively',\n",
       " 'affluently',\n",
       " 'affrightedly',\n",
       " 'affrightfully',\n",
       " 'affrightingly',\n",
       " 'affrontedly',\n",
       " 'affrontingly',\n",
       " 'agamically',\n",
       " 'agamogenetically',\n",
       " 'agedly',\n",
       " 'aggravatingly',\n",
       " 'aggregately',\n",
       " 'aggressively',\n",
       " 'aggrievedly',\n",
       " 'agilely',\n",
       " 'agitatedly',\n",
       " 'agnatically',\n",
       " 'agnostically',\n",
       " 'agonistically',\n",
       " 'agonizedly',\n",
       " 'agonizingly',\n",
       " 'agrarianly',\n",
       " 'agreeably',\n",
       " 'agreeingly',\n",
       " 'agriculturally',\n",
       " 'agrobiologically',\n",
       " 'agrogeologically',\n",
       " 'agrologically',\n",
       " 'aguishly',\n",
       " 'aimfully',\n",
       " 'aimlessly',\n",
       " 'airily',\n",
       " 'airtightly',\n",
       " 'alarmedly',\n",
       " 'alarmingly',\n",
       " 'alchemically',\n",
       " 'alcoholically',\n",
       " 'aldermanly',\n",
       " 'alertly',\n",
       " 'algebraically',\n",
       " 'algometrically',\n",
       " 'alimentally',\n",
       " 'alimentatively',\n",
       " 'alkalimetrically',\n",
       " 'allegedly',\n",
       " 'allegorically',\n",
       " 'allenarly',\n",
       " 'alleviatingly',\n",
       " 'alliably',\n",
       " 'allicholly',\n",
       " 'alliteratively',\n",
       " 'allochirally',\n",
       " 'allogenically',\n",
       " 'allopathetically',\n",
       " 'allopathically',\n",
       " 'allopatrically',\n",
       " 'allothigenetically',\n",
       " 'allotropically',\n",
       " 'allowably',\n",
       " 'allowedly',\n",
       " 'alluringly',\n",
       " 'allusively',\n",
       " 'Ally',\n",
       " 'ally',\n",
       " 'almightily',\n",
       " 'alodially',\n",
       " 'alogically',\n",
       " 'aloofly',\n",
       " 'alphabetically',\n",
       " 'alpinely',\n",
       " 'alterably',\n",
       " 'alternately',\n",
       " 'alternatingly',\n",
       " 'alternatively',\n",
       " 'altimetrically',\n",
       " 'altruistically',\n",
       " 'aly',\n",
       " 'amateurishly',\n",
       " 'amatively',\n",
       " 'amatorially',\n",
       " 'amazedly',\n",
       " 'amazingly',\n",
       " 'ambagiously',\n",
       " 'ambassadorially',\n",
       " 'ambidextrously',\n",
       " 'ambiguously',\n",
       " 'ambilateralaterally',\n",
       " 'ambitionlessly',\n",
       " 'ambitiously',\n",
       " 'amblingly',\n",
       " 'ambrosially',\n",
       " 'amenably',\n",
       " 'Americanly',\n",
       " 'ametaboly',\n",
       " 'amethodically',\n",
       " 'amiably',\n",
       " 'amicably',\n",
       " 'amitotically',\n",
       " 'amorously',\n",
       " 'amorphously',\n",
       " 'amphibiously',\n",
       " 'amphibologically',\n",
       " 'amphiboly',\n",
       " 'amphigenously',\n",
       " 'amphimictically',\n",
       " 'amphistyly',\n",
       " 'amphitheatrically',\n",
       " 'amply',\n",
       " 'amusedly',\n",
       " 'amusingly',\n",
       " 'amusively',\n",
       " 'Anabaptistically',\n",
       " 'anacamptically',\n",
       " 'anachronically',\n",
       " 'anachronistically',\n",
       " 'anachronously',\n",
       " 'anacoluthically',\n",
       " 'Anacreontically',\n",
       " 'anacrustically',\n",
       " 'anaerobically',\n",
       " 'anaerobiotically',\n",
       " 'anaesthetically',\n",
       " 'anagogically',\n",
       " 'anagrammatically',\n",
       " 'anally',\n",
       " 'analogically',\n",
       " 'analogously',\n",
       " 'analytically',\n",
       " 'anamnestically',\n",
       " 'anapaestically',\n",
       " 'anarchically',\n",
       " 'anarthrously',\n",
       " 'anathematically',\n",
       " 'Anatoly',\n",
       " 'anatomically',\n",
       " 'ancestorially',\n",
       " 'ancestrally',\n",
       " 'anciently',\n",
       " 'anecdotically',\n",
       " 'anemographically',\n",
       " 'anemometrically',\n",
       " 'anemometrographically',\n",
       " 'anemophily',\n",
       " 'anencephaly',\n",
       " 'anerly',\n",
       " 'anesthetically',\n",
       " 'aneurismally',\n",
       " 'aneurysmally',\n",
       " 'angelically',\n",
       " 'angerly',\n",
       " 'angiomegaly',\n",
       " 'Anglicanly',\n",
       " 'angrily',\n",
       " 'anguishously',\n",
       " 'angularly',\n",
       " 'angulately',\n",
       " 'animally',\n",
       " 'animatedly',\n",
       " 'animately',\n",
       " 'animatingly',\n",
       " 'anisocotyly',\n",
       " 'anisophylly',\n",
       " 'anisotropically',\n",
       " 'anniversarily',\n",
       " 'annoyingly',\n",
       " 'annually',\n",
       " 'annularly',\n",
       " 'anodically',\n",
       " 'anomalistically',\n",
       " 'anomalously',\n",
       " 'anomaly',\n",
       " 'anonymously',\n",
       " 'anorthographically',\n",
       " 'answerably',\n",
       " 'answeringly',\n",
       " 'answerlessly',\n",
       " 'antagonistically',\n",
       " 'antarctically',\n",
       " 'antecedaneously',\n",
       " 'antecedently',\n",
       " 'antediluvially',\n",
       " 'anteriorly',\n",
       " 'anterolaterally',\n",
       " 'anteroposteriorly',\n",
       " 'anteroventrally',\n",
       " 'anthologically',\n",
       " 'anthropologically',\n",
       " 'anthropometrically',\n",
       " 'anthropomorphically',\n",
       " 'anthropomorphologically',\n",
       " 'anthropomorphously',\n",
       " 'anthropopathically',\n",
       " 'anthropophagously',\n",
       " 'antichristianly',\n",
       " 'antichronically',\n",
       " 'anticipatively',\n",
       " 'anticipatorily',\n",
       " 'anticly',\n",
       " 'anticonstitutionally',\n",
       " 'anticyclonically',\n",
       " 'antidotally',\n",
       " 'antidotically',\n",
       " 'antidromically',\n",
       " 'antimonarchically',\n",
       " 'antimonopoly',\n",
       " 'antipathetically',\n",
       " 'antiperistatically',\n",
       " 'antiphonally',\n",
       " 'antiphonically',\n",
       " 'antiphrastically',\n",
       " 'antiquarianly',\n",
       " 'antiquely',\n",
       " 'antirachitically',\n",
       " 'antiseptically',\n",
       " 'antisocialistically',\n",
       " 'antistrophically',\n",
       " 'antitheistically',\n",
       " 'antithetically',\n",
       " 'antitypically',\n",
       " 'antonomastically',\n",
       " 'antrorsely',\n",
       " 'anxiously',\n",
       " 'aoristically',\n",
       " 'apagogically',\n",
       " 'apathetically',\n",
       " 'aperiodically',\n",
       " 'apertly',\n",
       " 'apetaly',\n",
       " 'apheliotropically',\n",
       " 'aphetically',\n",
       " 'aphoristically',\n",
       " 'aphylly',\n",
       " 'apically',\n",
       " 'apishly',\n",
       " 'aplanatically',\n",
       " 'apocalyptically',\n",
       " 'apocryphally',\n",
       " 'apodictically',\n",
       " 'apogamically',\n",
       " 'apogamously',\n",
       " 'apogeotropically',\n",
       " 'apologetically',\n",
       " 'apometaboly',\n",
       " 'apoplectically',\n",
       " 'aposematically',\n",
       " 'apostatically',\n",
       " 'apostolically',\n",
       " 'apothegmatically',\n",
       " 'appallingly',\n",
       " 'apparently',\n",
       " 'appealingly',\n",
       " 'appeasably',\n",
       " 'appeasingly',\n",
       " 'appellatively',\n",
       " 'apperceptively',\n",
       " 'appetently',\n",
       " 'appetizingly',\n",
       " 'applaudably',\n",
       " 'applaudingly',\n",
       " 'applausively',\n",
       " 'appliably',\n",
       " 'applicably',\n",
       " 'applicatively',\n",
       " 'applicatorily',\n",
       " 'appliedly',\n",
       " 'apply',\n",
       " 'applyingly',\n",
       " 'appositely',\n",
       " 'appositionally',\n",
       " 'appositively',\n",
       " 'appraisingly',\n",
       " 'appreciably',\n",
       " 'appreciatingly',\n",
       " 'appreciatively',\n",
       " 'appreciatorily',\n",
       " 'apprehendingly',\n",
       " 'apprehensibly',\n",
       " 'apprehensively',\n",
       " 'appropriately',\n",
       " 'approvedly',\n",
       " 'approvingly',\n",
       " 'approximately',\n",
       " 'approximatively',\n",
       " 'appulsively',\n",
       " 'apsidally',\n",
       " 'aptitudinally',\n",
       " 'aptly',\n",
       " 'aquatically',\n",
       " 'aqueously',\n",
       " 'arabesquely',\n",
       " 'arbitrarily',\n",
       " 'arboreally',\n",
       " 'arborescently',\n",
       " 'Arcadianly',\n",
       " 'archaeologically',\n",
       " 'archaically',\n",
       " 'archetypally',\n",
       " 'archetypically',\n",
       " 'archiepiscopally',\n",
       " 'architectonically',\n",
       " 'architecturally',\n",
       " 'archly',\n",
       " 'arctically',\n",
       " 'arcuately',\n",
       " 'ardently',\n",
       " 'arduously',\n",
       " 'areographically',\n",
       " 'areologically',\n",
       " 'argentometrically',\n",
       " 'argumentatively',\n",
       " 'argutely',\n",
       " 'aridly',\n",
       " 'arightly',\n",
       " 'aristocratically',\n",
       " 'arithmetically',\n",
       " 'aromatically',\n",
       " 'arrantly',\n",
       " 'arrestingly',\n",
       " 'arrhythmically',\n",
       " 'arrogantly',\n",
       " 'arrogatingly',\n",
       " 'arterially',\n",
       " 'artfully',\n",
       " 'articularly',\n",
       " 'articulately',\n",
       " 'artificially',\n",
       " 'artistically',\n",
       " 'artlessly',\n",
       " 'ascendingly',\n",
       " 'ascertainably',\n",
       " 'ascetically',\n",
       " 'aseptically',\n",
       " 'asexually',\n",
       " 'ashamedly',\n",
       " 'ashily',\n",
       " 'Asiatically',\n",
       " 'asininely',\n",
       " 'askingly',\n",
       " 'asperously',\n",
       " 'aspersively',\n",
       " 'aspiringly',\n",
       " 'assembly',\n",
       " 'assentatorily',\n",
       " 'assentingly',\n",
       " 'assertively',\n",
       " 'assertorially',\n",
       " 'assertorically',\n",
       " 'assertorily',\n",
       " 'assessably',\n",
       " 'asseveratingly',\n",
       " 'asseveratively',\n",
       " 'assidually',\n",
       " 'assiduously',\n",
       " 'assignably',\n",
       " 'assishly',\n",
       " 'associatively',\n",
       " 'assumably',\n",
       " 'assumedly',\n",
       " 'assumingly',\n",
       " 'assumptively',\n",
       " 'assuredly',\n",
       " 'assuringly',\n",
       " 'astatically',\n",
       " 'astely',\n",
       " 'asthmatically',\n",
       " 'astigmatically',\n",
       " 'astonishedly',\n",
       " 'astonishingly',\n",
       " 'astoundingly',\n",
       " 'astrally',\n",
       " 'astrictively',\n",
       " 'astringently',\n",
       " 'astrologically',\n",
       " 'astronomically',\n",
       " 'astuciously',\n",
       " 'astutely',\n",
       " 'asymmetrically',\n",
       " 'asymptotically',\n",
       " 'asyndetically',\n",
       " 'atavistically',\n",
       " 'atheistically',\n",
       " 'Athenianly',\n",
       " 'atheologically',\n",
       " 'athletically',\n",
       " 'atmospherically',\n",
       " 'atomically',\n",
       " 'atomistically',\n",
       " 'atonally',\n",
       " 'atoningly',\n",
       " 'atrociously',\n",
       " 'attachedly',\n",
       " 'attemperately',\n",
       " 'attendantly',\n",
       " 'attendingly',\n",
       " 'attentively',\n",
       " 'attently',\n",
       " 'attractingly',\n",
       " 'attractionally',\n",
       " 'attractively',\n",
       " 'attributively',\n",
       " 'attunely',\n",
       " 'atypically',\n",
       " 'audaciously',\n",
       " 'audibly',\n",
       " 'auditorially',\n",
       " 'auditorily',\n",
       " 'augmentatively',\n",
       " 'augmentedly',\n",
       " 'augustly',\n",
       " 'auntly',\n",
       " 'aurally',\n",
       " 'aureately',\n",
       " 'aureously',\n",
       " 'auricularly',\n",
       " 'auriculately',\n",
       " 'aurorally',\n",
       " 'auspiciously',\n",
       " 'austerely',\n",
       " 'auteciously',\n",
       " 'autecologically',\n",
       " 'authentically',\n",
       " 'authenticly',\n",
       " 'authorially',\n",
       " 'authoritatively',\n",
       " 'authorly',\n",
       " 'autobiographically',\n",
       " 'autocatalytically',\n",
       " 'autocephaly',\n",
       " 'autochthonously',\n",
       " 'autocratically',\n",
       " 'autoeciously',\n",
       " 'autoerotically',\n",
       " 'autogenetically',\n",
       " 'autogenously',\n",
       " 'autographically',\n",
       " 'automatically',\n",
       " 'automorphically',\n",
       " 'autonomically',\n",
       " 'autonomously',\n",
       " 'autophytically',\n",
       " 'autoptically',\n",
       " 'autoschediastically',\n",
       " 'autostyly',\n",
       " 'autosymbolically',\n",
       " 'autotropically',\n",
       " 'autumnally',\n",
       " 'auxetically',\n",
       " 'auxiliarly',\n",
       " 'auxinically',\n",
       " 'availably',\n",
       " 'availingly',\n",
       " 'avariciously',\n",
       " 'avengingly',\n",
       " 'averagely',\n",
       " 'aversely',\n",
       " 'avertedly',\n",
       " 'avidiously',\n",
       " 'avidly',\n",
       " 'avoidably',\n",
       " 'avowably',\n",
       " 'avowedly',\n",
       " 'awakeningly',\n",
       " 'awesomely',\n",
       " 'awfully',\n",
       " 'awkwardly',\n",
       " 'axially',\n",
       " 'axiologically',\n",
       " 'axiomatically',\n",
       " 'azimuthally',\n",
       " 'babblingly',\n",
       " 'babblishly',\n",
       " 'babbly',\n",
       " 'babishly',\n",
       " 'babyishly',\n",
       " 'bacchanalianly',\n",
       " 'bachelorly',\n",
       " 'backbitingly',\n",
       " 'backhandedly',\n",
       " 'backwardly',\n",
       " 'bacterially',\n",
       " 'bacteriologically',\n",
       " 'bacterioscopically',\n",
       " 'baddishly',\n",
       " 'badgeringly',\n",
       " 'badgerly',\n",
       " 'badly',\n",
       " 'bafflingly',\n",
       " 'baggily',\n",
       " 'bairnly',\n",
       " 'bakerly',\n",
       " 'bakingly',\n",
       " 'baldly',\n",
       " 'balefully',\n",
       " 'balkingly',\n",
       " 'ballistically',\n",
       " 'bally',\n",
       " 'balmily',\n",
       " 'balsamically',\n",
       " 'banally',\n",
       " 'bandlessly',\n",
       " 'banefully',\n",
       " 'bankruptly',\n",
       " 'banteringly',\n",
       " 'baptismally',\n",
       " 'barbarically',\n",
       " 'barbarously',\n",
       " 'bardily',\n",
       " 'barefacedly',\n",
       " 'barely',\n",
       " 'barfly',\n",
       " 'barkingly',\n",
       " 'barometrically',\n",
       " 'barratrously',\n",
       " 'barrenly',\n",
       " 'barruly',\n",
       " 'basally',\n",
       " 'baselessly',\n",
       " 'basely',\n",
       " 'bashfully',\n",
       " 'basically',\n",
       " 'bastardly',\n",
       " 'bathymetrically',\n",
       " 'bawdily',\n",
       " 'bayardly',\n",
       " 'beadily',\n",
       " 'beamily',\n",
       " 'beamingly',\n",
       " 'bearably',\n",
       " 'bearishly',\n",
       " 'beastily',\n",
       " 'beastlily',\n",
       " 'beastly',\n",
       " 'beatifically',\n",
       " 'beauteously',\n",
       " 'beautifully',\n",
       " 'beckoningly',\n",
       " 'becomingly',\n",
       " 'bedazzlingly',\n",
       " 'beefily',\n",
       " 'beerily',\n",
       " 'beerishly',\n",
       " 'befittingly',\n",
       " 'beggarly',\n",
       " 'beggingly',\n",
       " 'begrudgingly',\n",
       " 'beguilingly',\n",
       " 'behavioristically',\n",
       " 'behoovefully',\n",
       " 'behoovingly',\n",
       " 'beknottedly',\n",
       " 'belatedly',\n",
       " 'believingly',\n",
       " 'bellicosely',\n",
       " 'belligerently',\n",
       " 'belly',\n",
       " 'bely',\n",
       " 'belyingly',\n",
       " 'bemoaningly',\n",
       " 'bemusedly',\n",
       " 'bendingly',\n",
       " 'benedictively',\n",
       " 'beneficently',\n",
       " 'beneficially',\n",
       " 'benevolently',\n",
       " 'benignantly',\n",
       " 'benignly',\n",
       " 'benumbingly',\n",
       " 'beseechingly',\n",
       " 'beseemingly',\n",
       " 'beseemly',\n",
       " 'besiegingly',\n",
       " 'besottedly',\n",
       " 'besottingly',\n",
       " 'bestially',\n",
       " 'besully',\n",
       " 'betterly',\n",
       " 'Beverly',\n",
       " 'bewailingly',\n",
       " 'bewilderedly',\n",
       " 'bewilderingly',\n",
       " 'bewitchingly',\n",
       " 'bewrayingly',\n",
       " 'biannually',\n",
       " 'biaxially',\n",
       " 'Biblically',\n",
       " 'bibliographically',\n",
       " 'bibliophily',\n",
       " 'bibliopolically',\n",
       " 'bibliopoly',\n",
       " 'bibulously',\n",
       " 'biconically',\n",
       " 'biddably',\n",
       " 'bienly',\n",
       " 'biennially',\n",
       " 'bifariously',\n",
       " 'bifidly',\n",
       " 'bifilarly',\n",
       " 'bifurcately',\n",
       " 'bigamously',\n",
       " 'bigotedly',\n",
       " 'bihourly',\n",
       " 'bilaterally',\n",
       " 'bilingually',\n",
       " 'biliously',\n",
       " 'billiardly',\n",
       " 'Billy',\n",
       " 'billy',\n",
       " 'bimanually',\n",
       " 'bimonthly',\n",
       " 'binately',\n",
       " 'bindingly',\n",
       " 'binocularly',\n",
       " 'binomially',\n",
       " 'biochemically',\n",
       " 'bioecologically',\n",
       " 'biogenetically',\n",
       " 'biogeographically',\n",
       " 'biographically',\n",
       " 'biologically',\n",
       " 'biometrically',\n",
       " 'bionomically',\n",
       " 'bipartitely',\n",
       " 'bipinnately',\n",
       " 'biquarterly',\n",
       " 'bisectionally',\n",
       " 'biserially',\n",
       " 'biseriately',\n",
       " 'bisexually',\n",
       " 'bisymmetrically',\n",
       " 'biternately',\n",
       " 'bitingly',\n",
       " 'bitterly',\n",
       " 'biweekly',\n",
       " 'biyearly',\n",
       " 'bizarrely',\n",
       " 'blackbelly',\n",
       " 'blackguardly',\n",
       " 'blackishly',\n",
       " 'blackly',\n",
       " 'blamably',\n",
       " 'blamefully',\n",
       " 'blamelessly',\n",
       " 'blamingly',\n",
       " 'blanchingly',\n",
       " 'blandishingly',\n",
       " 'blandly',\n",
       " 'blankly',\n",
       " 'blasphemously',\n",
       " 'blatantly',\n",
       " 'blately',\n",
       " 'blazingly',\n",
       " 'bleakly',\n",
       " 'bleatingly',\n",
       " 'blenchingly',\n",
       " 'blessedly',\n",
       " 'blessingly',\n",
       " 'blightingly',\n",
       " 'blindedly',\n",
       " 'blindfoldly',\n",
       " 'blindingly',\n",
       " 'blindly',\n",
       " 'blinkingly',\n",
       " 'blissfully',\n",
       " 'blisteringly',\n",
       " 'blithefully',\n",
       " 'blithely',\n",
       " 'blithesomely',\n",
       " 'blizzardly',\n",
       " 'blockheadedly',\n",
       " 'blockishly',\n",
       " 'blolly',\n",
       " 'bloodily',\n",
       " 'bloodlessly',\n",
       " 'bloodthirstily',\n",
       " 'bloomingly',\n",
       " 'blottesquely',\n",
       " 'blottingly',\n",
       " 'blowfly',\n",
       " 'blubberingly',\n",
       " 'bluely',\n",
       " 'bluffly',\n",
       " 'blunderingly',\n",
       " 'bluntly',\n",
       " 'blushfully',\n",
       " 'blushingly',\n",
       " 'blusteringly',\n",
       " 'blusterously',\n",
       " 'boardly',\n",
       " 'boarishly',\n",
       " 'boastfully',\n",
       " 'boatly',\n",
       " 'bobbishly',\n",
       " 'bobfly',\n",
       " 'bodaciously',\n",
       " 'bodily',\n",
       " 'bodingly',\n",
       " 'boilingly',\n",
       " 'boily',\n",
       " 'boisterously',\n",
       " 'boldly',\n",
       " 'bolly',\n",
       " 'bolographically',\n",
       " 'Bolshevistically',\n",
       " 'bombastically',\n",
       " 'bonairly',\n",
       " 'bonally',\n",
       " 'bonelessly',\n",
       " 'bonnily',\n",
       " 'boobily',\n",
       " 'bookishly',\n",
       " 'booly',\n",
       " 'boomingly',\n",
       " 'boorishly',\n",
       " 'bootlessly',\n",
       " 'boozily',\n",
       " 'boringly',\n",
       " 'botanically',\n",
       " 'botchedly',\n",
       " 'botcherly',\n",
       " 'botchily',\n",
       " 'botfly',\n",
       " 'botryoidally',\n",
       " 'bottomlessly',\n",
       " 'bounceably',\n",
       " 'bouncingly',\n",
       " 'boundedly',\n",
       " 'boundingly',\n",
       " 'boundlessly',\n",
       " 'boundly',\n",
       " 'bounteously',\n",
       " 'bountifully',\n",
       " 'bovinely',\n",
       " 'bowingly',\n",
       " 'bowly',\n",
       " 'boyishly',\n",
       " 'brabblingly',\n",
       " 'brachistocephaly',\n",
       " 'brachycephaly',\n",
       " 'brachydactyly',\n",
       " 'bracingly',\n",
       " 'braggartly',\n",
       " 'braggingly',\n",
       " 'braggishly',\n",
       " 'brainlessly',\n",
       " 'brainsickly',\n",
       " 'brambly',\n",
       " 'brassily',\n",
       " 'bravely',\n",
       " 'brawlingly',\n",
       " 'brawly',\n",
       " 'brawnily',\n",
       " 'brazenfacedly',\n",
       " 'brazenly',\n",
       " 'breakably',\n",
       " 'breathingly',\n",
       " 'breathlessly',\n",
       " 'breezily',\n",
       " 'bremely',\n",
       " 'brickly',\n",
       " 'bridally',\n",
       " 'bridely',\n",
       " 'brieflessly',\n",
       " 'briefly',\n",
       " 'brigandishly',\n",
       " 'brightly',\n",
       " 'brilliantly',\n",
       " 'brimfully',\n",
       " 'brimmingly',\n",
       " 'briskly',\n",
       " 'bristly',\n",
       " 'Britannically',\n",
       " 'Britishly',\n",
       " 'brittlely',\n",
       " 'broadly',\n",
       " 'broilingly',\n",
       " 'brokenheartedly',\n",
       " 'brokenly',\n",
       " 'brolly',\n",
       " 'bromidically',\n",
       " 'bromometrically',\n",
       " 'bronchially',\n",
       " 'broodingly',\n",
       " 'brotherly',\n",
       " 'brownly',\n",
       " 'brusquely',\n",
       " 'brutally',\n",
       " 'brutely',\n",
       " 'brutishly',\n",
       " 'bubblingly',\n",
       " 'bubbly',\n",
       " 'buccally',\n",
       " 'buckishly',\n",
       " 'bucolically',\n",
       " 'buirdly',\n",
       " 'bulkily',\n",
       " 'bullheadedly',\n",
       " 'bullishly',\n",
       " 'bully',\n",
       " 'bumpily',\n",
       " 'bumpingly',\n",
       " 'bumpkinly',\n",
       " 'bumptiously',\n",
       " 'bunchily',\n",
       " 'bungerly',\n",
       " 'bunglingly',\n",
       " 'buoyantly',\n",
       " 'burbly',\n",
       " 'burdensomely',\n",
       " 'bureaucratically',\n",
       " 'burglariously',\n",
       " 'burlesquely',\n",
       " 'burlily',\n",
       " 'burly',\n",
       " 'burningly',\n",
       " 'bushily',\n",
       " 'busily',\n",
       " 'bustlingly',\n",
       " 'butcherly',\n",
       " 'butterfly',\n",
       " 'butyrically',\n",
       " 'buxomly',\n",
       " 'buzzardly',\n",
       " 'buzzingly',\n",
       " 'byously',\n",
       " 'Byronically',\n",
       " 'cabalistically',\n",
       " 'cacophonically',\n",
       " 'cacophonously',\n",
       " ...]"
      ]
     },
     "execution_count": 161,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "last_letters['ly']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 163,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Group words by their sorted letters: words that share a key are anagrams of each other.\n",
    "# NOTE(review): `words` comes from an earlier cell that is not visible here -- confirm it is the word list.\n",
    "anagrams = nltk.defaultdict(list)\n",
    "for word in words:\n",
    "    key = ''.join(sorted(word))  # canonical signature, e.g. 'aeilnrt' for 'entrail'\n",
    "    anagrams[key].append(word)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 164,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['entrail', 'latrine', 'ratline', 'reliant', 'retinal', 'trenail']"
      ]
     },
     "execution_count": 164,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "anagrams['aeilnrt']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 165,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Same grouping in one step: nltk.Index takes (key, value) pairs and collects the values per key.\n",
    "anagrams = nltk.Index((''.join(sorted(w)), w) for w in words)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 166,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['entrail', 'latrine', 'ratline', 'reliant', 'retinal', 'trenail']"
      ]
     },
     "execution_count": 166,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "anagrams['aeilnrt']"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 6 复杂的键和值"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 167,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# pos maps (tag of the previous word, current word) -> counts of the current word's tag.\n",
    "# NOTE(review): bare `defaultdict` needs `from collections import defaultdict` from an earlier cell;\n",
    "# it is not in the notebook's first import cell -- confirm it survives Restart & Run All.\n",
    "pos = defaultdict(lambda: defaultdict(int))\n",
    "\n",
    "brown_news_tagged = nltk.corpus.brown.tagged_words(categories='news', tagset='universal')\n",
    "\n",
    "# Walk over consecutive (word, tag) pairs; w1 is unpacked but never used.\n",
    "for ((w1, t1), (w2, t2)) in nltk.bigrams(brown_news_tagged):\n",
    "    pos[(t1, w2)][t2] += 1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 168,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "defaultdict(int, {'ADJ': 11, 'NOUN': 5})"
      ]
     },
     "execution_count": 168,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "pos[('DET', 'right')]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 7 颠倒字典"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 5.4 自动标注"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 169,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# NOTE(review): import placed mid-notebook; the other imports live in the first cell.\n",
    "from nltk.corpus import brown\n",
    "\n",
    "# Tagged and plain sentences from the 'news' category of the Brown corpus.\n",
    "brown_tagged_sents = brown.tagged_sents(categories='news')\n",
    "brown_sents = brown.sents(categories='news')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 1 默认标注器"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "> 默认的标注器给每一个单独的词分配标记，即使是之前从未遇到过的词。碰巧的是，一旦我们处理了几千词的英文文本之后，大多数新词都将是名词。正如我们将看到的，这意味着，默认标注器可以帮助我们提高语言处理系统的稳定性。我们将很快回来讲述这个。"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 170,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'NN'"
      ]
     },
     "execution_count": 170,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Collect every tag in the 'news' category and show the most frequent one.\n",
    "tags = [tag for (word, tag) in brown.tagged_words(categories='news')]\n",
    "nltk.FreqDist(tags).max()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 172,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "raw = 'I do not like green eggs and ham, I do not like them Sam I am!'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 173,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "tokens = word_tokenize(raw)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 174,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('I', 'NN'),\n",
       " ('do', 'NN'),\n",
       " ('not', 'NN'),\n",
       " ('like', 'NN'),\n",
       " ('green', 'NN'),\n",
       " ('eggs', 'NN'),\n",
       " ('and', 'NN'),\n",
       " ('ham', 'NN'),\n",
       " (',', 'NN'),\n",
       " ('I', 'NN'),\n",
       " ('do', 'NN'),\n",
       " ('not', 'NN'),\n",
       " ('like', 'NN'),\n",
       " ('them', 'NN'),\n",
       " ('Sam', 'NN'),\n",
       " ('I', 'NN'),\n",
       " ('am', 'NN'),\n",
       " ('!', 'NN')]"
      ]
     },
     "execution_count": 174,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Tag every token with one and the same tag: 'NN', the most frequent tag in the news category.\n",
    "default_tagger = nltk.DefaultTagger('NN')\n",
    "default_tagger.tag(tokens)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 175,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.13089484257215028"
      ]
     },
     "execution_count": 175,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "default_tagger.evaluate(brown_tagged_sents)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 2 正则表达式标注器"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 176,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    " patterns = [\n",
    "...     (r'.*ing$', 'VBG'),               # gerunds\n",
    "...     (r'.*ed$', 'VBD'),                # simple past\n",
    "...     (r'.*es$', 'VBZ'),                # 3rd singular present\n",
    "...     (r'.*ould$', 'MD'),               # modals\n",
    "...     (r'.*\\'s$', 'NN$'),               # possessive nouns\n",
    "...     (r'.*s$', 'NNS'),                 # plural nouns\n",
    "...     (r'^-?[0-9]+(.[0-9]+)?$', 'CD'),  # cardinal numbers\n",
    "...     (r'.*', 'NN')                     # nouns (default)\n",
    "... ]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 178,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('``', 'NN'),\n",
       " ('Only', 'NN'),\n",
       " ('a', 'NN'),\n",
       " ('relative', 'NN'),\n",
       " ('handful', 'NN'),\n",
       " ('of', 'NN'),\n",
       " ('such', 'NN'),\n",
       " ('reports', 'NNS'),\n",
       " ('was', 'NNS'),\n",
       " ('received', 'VBD'),\n",
       " (\"''\", 'NN'),\n",
       " (',', 'NN'),\n",
       " ('the', 'NN'),\n",
       " ('jury', 'NN'),\n",
       " ('said', 'NN'),\n",
       " (',', 'NN'),\n",
       " ('``', 'NN'),\n",
       " ('considering', 'VBG'),\n",
       " ('the', 'NN'),\n",
       " ('widespread', 'NN'),\n",
       " ('interest', 'NN'),\n",
       " ('in', 'NN'),\n",
       " ('the', 'NN'),\n",
       " ('election', 'NN'),\n",
       " (',', 'NN'),\n",
       " ('the', 'NN'),\n",
       " ('number', 'NN'),\n",
       " ('of', 'NN'),\n",
       " ('voters', 'NNS'),\n",
       " ('and', 'NN'),\n",
       " ('the', 'NN'),\n",
       " ('size', 'NN'),\n",
       " ('of', 'NN'),\n",
       " ('this', 'NNS'),\n",
       " ('city', 'NN'),\n",
       " (\"''\", 'NN'),\n",
       " ('.', 'NN')]"
      ]
     },
     "execution_count": 178,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Build a tagger from the pattern list and tag the news sentence at index 3.\n",
    "regexp_tagger = nltk.RegexpTagger(patterns)\n",
    "regexp_tagger.tag(brown_sents[3])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 179,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.20326391789486245"
      ]
     },
     "execution_count": 179,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "regexp_tagger.evaluate(brown_tagged_sents)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 3 查询标注器"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "> 这里选择出现次数最多的词语及其最常见的词性来初始化词性标注器；但是有很多词并没有出现在这个词表中，所以性能并不是很高。"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 181,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "fd = nltk.FreqDist(brown.words(categories='news'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 182,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "cfd = nltk.ConditionalFreqDist(brown.tagged_words(categories='news'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 184,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "most_freq_words = fd.most_common(100)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 186,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Lookup table: each of the most frequent words -> the tag it carries most often in cfd.\n",
    "likely_tags = dict((word, cfd[word].max()) for (word, _) in most_freq_words)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 188,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "baseline_tagger = nltk.UnigramTagger(model=likely_tags)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 189,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.45578495136941344"
      ]
     },
     "execution_count": 189,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "baseline_tagger.evaluate(brown_tagged_sents)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 190,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "sent = brown.sents(categories='news')[3]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 192,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('``', '``'),\n",
       " ('Only', None),\n",
       " ('a', 'AT'),\n",
       " ('relative', None),\n",
       " ('handful', None),\n",
       " ('of', 'IN'),\n",
       " ('such', None),\n",
       " ('reports', None),\n",
       " ('was', 'BEDZ'),\n",
       " ('received', None),\n",
       " (\"''\", \"''\"),\n",
       " (',', ','),\n",
       " ('the', 'AT'),\n",
       " ('jury', None),\n",
       " ('said', 'VBD'),\n",
       " (',', ','),\n",
       " ('``', '``'),\n",
       " ('considering', None),\n",
       " ('the', 'AT'),\n",
       " ('widespread', None),\n",
       " ('interest', None),\n",
       " ('in', 'IN'),\n",
       " ('the', 'AT'),\n",
       " ('election', None),\n",
       " (',', ','),\n",
       " ('the', 'AT'),\n",
       " ('number', None),\n",
       " ('of', 'IN'),\n",
       " ('voters', None),\n",
       " ('and', 'CC'),\n",
       " ('the', 'AT'),\n",
       " ('size', None),\n",
       " ('of', 'IN'),\n",
       " ('this', 'DT'),\n",
       " ('city', None),\n",
       " (\"''\", \"''\"),\n",
       " ('.', '.')]"
      ]
     },
     "execution_count": 192,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "baseline_tagger.tag(sent)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 193,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Backoff: a word that is missing from the lookup table is tagged 'NN' by the default tagger.\n",
    "baseline_tagger = nltk.UnigramTagger(model=likely_tags, backoff=nltk.DefaultTagger('NN'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 194,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "def performance(cfd, wordlist):\n",
    "    \"\"\"Score a lookup tagger restricted to `wordlist` on the Brown news sentences.\n",
    "\n",
    "    Each word in `wordlist` is mapped to `cfd[word].max()`; every other token is\n",
    "    tagged 'NN' by the backoff DefaultTagger. Returns the result of\n",
    "    `UnigramTagger.evaluate` on `brown.tagged_sents(categories='news')`.\n",
    "    \"\"\"\n",
    "    lookup = {word: cfd[word].max() for word in wordlist}\n",
    "    fallback = nltk.DefaultTagger('NN')\n",
    "    tagger = nltk.UnigramTagger(model=lookup, backoff=fallback)\n",
    "    gold_sents = brown.tagged_sents(categories='news')\n",
    "    return tagger.evaluate(gold_sents)\n",
    "\n",
    "def display():\n",
    "    \"\"\"Plot lookup-tagger performance against model size (1, 2, 4, ..., 2**14 words).\n",
    "\n",
    "    Words are ranked by frequency in the Brown news category; for each size the\n",
    "    top-`size` words form the lookup model that `performance` scores.\n",
    "    NOTE(review): in a notebook this name may shadow IPython's own `display` helper.\n",
    "    \"\"\"\n",
    "    import pylab\n",
    "    news_counts = nltk.FreqDist(brown.words(categories='news'))\n",
    "    ranked_words = [entry[0] for entry in news_counts.most_common()]\n",
    "    cfd = nltk.ConditionalFreqDist(brown.tagged_words(categories='news'))\n",
    "    sizes = 2 ** pylab.arange(15)\n",
    "    perfs = []\n",
    "    for size in sizes:\n",
    "        perfs.append(performance(cfd, ranked_words[:size]))\n",
    "    pylab.plot(sizes, perfs, '-bo')\n",
    "    pylab.title('Lookup Tagger Performance with Varying Model Size')\n",
    "    pylab.xlabel('Model Size')\n",
    "    pylab.ylabel('Performance')\n",
    "    pylab.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 195,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAAYUAAAEWCAYAAACJ0YulAAAABHNCSVQICAgIfAhkiAAAAAlwSFlz\nAAALEgAACxIB0t1+/AAAIABJREFUeJzt3XmcHVWd9/HPNwlL2JEEBLLqsEUNiG1AZVFRDG5BgWEJ\nIALGOIA6Pi6McUE08+D2jDiDYAZZlAYEBGWURdGRVSABISFshrAkEUgCGJYAScjv+eOc2119c7v7\ndqert/t9v1731bdO1a363brV9atzquqUIgIzMzOAIX0dgJmZ9R9OCmZm1sJJwczMWjgpmJlZCycF\nMzNr4aRgZmYtnBTqJOnPkk7s6zgahaQdJd0m6QVJM/s6nv5E0p8kHd7B+Eslfa03Y6qXpPdJurev\n46iXpI0lhaRRdUw7WdKCbi7nW5L+qzuf7WmDMilIekzS+/o6jq6SdK2kF/NrtaRVheFz+jq+juR/\niLU51hckPSDp6PWY5b8Aj0XE5hExo6fiHAwi4r0R8UsASdMl3dCd+UjaLP9e76wx7mxJF61vrNUi\n4oaI2L2n5wsg6fa8A9+lqvzaXL53Gcutl6RDJc2V9LykZZJuqCSbiPhmRJzcl/FVDMqkMFBFxEER\nsVlEbAY0A9+rDEfE9L6Or0LSsHZGLcyxbwF8E7hA0hu7OO8hkoYAY4H7ezg+K4iIF4FfAccWyyVt\nCPwzcGFX59kP1v3DFL6PpO2BicA/+iyiFMcE4FzgZGBL4I3ALGBtX8ZVS8MlBUmfkrRA0rOSrpa0\nQ2HcOyXNlrQi/13nCCpPt33O+F/Kw21qJpJOqxxlSRqXj1KmSfq7pCclfbGbsY/MRz3Lcvy/yRt9\nZfxOhSaX6yT9VNK5hfEnSlqUP/9lSU9J2iePGyrp65IWSlouqVnSVnncrpLW5HW3CLimozgjuQx4\nGdgtz2NfSXdI+oekuyW9qxDX7ZJOl3QHsBL4I3A48PV8JLuvpOGSzsrrb7Gk70vaIH9+cv5Nvy7p\naeDsQtnX8vdZIumDkqZIekTSM5L+TyGGdxXi+7uk/6js4NTahDAtf/Y5Sf9R9dv8i6QH87qfJ+kt\nuXx0/p2W53VbM7lL2k3S0sLwLyQ9URi+vPLZvL6OlvRW4EfAu/N6eqowyxGSrs/x3CppbDs/14XA\nP0vaqFD24fzb/TEv7xuSHs3zuk/ShwpxTVdqzjpL0nPAV5WOhHcqTDNK0kpJW6mqiSVvg/+a57si\nb3cbFsZ/TdLT+Tefps6bci4CpkpSHp4KXAa8Vphnu9tSHj+jskygTW03f/ZH+f/oKUn/WbXu2rMn\n8GBE3JT/P56PiMsi4u95vmco/69KOletLQQvSnpN0ql5XF3b03qJiEH3Ah4D3lej/L3A8vwDbQT8\nJ3BTHvc64DngGGAYcGQe3iaP/zNwIjCedDQyrb3lAacBF+X344AALgE2Bd4CLKsVX1WsFwDfqSrb\nDpgCDCcdbfwGuDSPE/BXYCawIfBu4CXg3Dz+rcDzwN75u/8YWAPsk8d/BbgZ2AHYOC///Dxu1/wd\nzgU2AYbXiHcysCC/HwIcAazK338c8Azwvjzug3kdbJ2nvx1YCOwCbJDX/6XA1wrz/16Ob0ReD7OB\nGYVlrwFOz999eKHsK3l+pwBPAb/Iv8NbgVeAHfM8JgFvB4aSjuIWANPzuI3z97+SVAsaTzryfHce\nfwzweJ6n8vcYlec1L8ewIbAz8ASwfzu/+dPAmwrb1KPA+MK43Qrr6+j8fjpwQ9V8LgWWkrbzDYAr\ngAvaWaZy7IcWyq4CzigMHw5sn3+7Y4AXgBGF5a8BPpW/73DgPOBbhc9/Bbi8ejvJw08Bt+bfdGRe\n78flcQcDi/P63JS0cw9gVDvf5XbSTvwm4D257N78uywH9q5jWzoYWELa5jcj1aRalgmcndfnVqT/\nweuBb9b6blWx7Qq8Cnyf9L+5adX4M8
j/q1Xlk0j/K2/q6vbU7f1nT86sv7xoPyn8jNQkUxneDFhN\n2mkdA9xZNf1fChvon4H/l+d9ZEfLo3ZS2LUw/nvAzzr5DhdQlRRqTLM38GR+vzPp6G6jwvgraE0K\n/07eyefhLUhV10pSeBR4V2H8eNJRu2hNCjt0EMtk0tHYP4BngbuBQ/K4bwL/XTX9jcDh+f3twFer\nxlcnhSXAewvDU0hHXpVlvwRsUBXPCmBIHh6Zv8PuhWnmA5Pb+T6nApfk95Wk0FQYfzXw+cJ3+XSN\neewP/K2q7FvA2e0s83LSuZRxwFxS4j6OVNt6ujBdPUnhvwrDHwfu6eC3+w5wdX6/DWnntVsH0z8I\nfKCw/IdrfO/ijn8e8NHC71KdFIoJ6cfAj/L7i8k73Dz8ZupLCicC5wN7APPyuGJS6Ghbuhg4rTBu\nYmWZpIOLVeQDiTz+PcADtb5bjfj2ISWZ5aT/1XPJB1jUSAqkRLwIOLg721N3X33d/tfbdiDtrIDU\npirpGWDHPO7xqukfz+MqppKOZK7oxrIXVc33LV2dgaTNgTNJR9xb5eLh+e8OwLKIeLVqmZsXxrc0\nR0TE85JW5PkKGA1cIykKnx9C2kkArI1c1e3AoxHxTzXKxwJHSjqsULZBjqkYa005vtfT9vep/m2e\niojVVR9dFhGVNtuX89+nC+NfJh0YVNp8f0g6uh5O2gHcWjW/YvPMyspnSevukRqhjwXGSSq2Zw8F\n2jsxfCPpKPLF/P7PwEdISemmdj7TnvZireXnwH2SRgKHAXMj4oHKSEknAJ8DxuSizUhH2RXVv91N\nwFBJ7yCt4+2Ba7sQa2XeO9B2XbW7jVS5nFRjfpX03VrUsS3tQG42K4yjMG4DYH5r6xQi1ZQ6FRG3\nALfkON5Bqvl8mbRjbyM3SV1JOpj6dS7u6vbULY12TuHvpBULgKRNSTu9JdXjsjF5XMVppCx/saSh\nhfKXSM0qFa+vsezRVfPtbAdby6mkI5a3R8QWwIGkjRLgSWBkVftmcZlP5s8CIGkLUvWXSIcclaOn\nrQqvjSNief5IMVl01SLSUVBx3ptGRLFdvt355/ieou3vU/3brE98AP9NOmB4Y163p9O6bjuziNTk\nVKv8warvvXlEfKyd+dxIOhrcL7+/Kb/fPw/Xsr7fm4h4GJhDajI9hsIJZkk7k5pZpwGvi4itSAdG\nxXXTJob8e/2cdNR+DKmJszph16PNNkvb7bldEbEC+F/gBNIFG9WxdbQtPcm6/6vFeNaQtpHK77ll\nRGxDF0XEX0jNv29uZ5JzSPuIbxfKuro9dctgTgob5BOEldcwUrv+JyXtkXee/w7cERGPkU6e7izp\nKEnDlK4DnwD8tjDP1aQjqU2BnytdJQNwD3CEpA0kNQGH1ojn65I2kfQm4JPAL7vxnTYnHUn9Q9II\noHgt+sPAQ8DXchz7kaqzFZcBh0h6ez6Rdzptr3w4BzhD0mgASdtK+kg3YqzlQuAwSQcondAent/X\nSp7tuQT4pqRtJG0LzCCdVOwpmwMrcu3xTaQ28nqdC5wqaXclO+eToZWjws9XtkFJEyXt2c587iMd\n+R1GOte1nPR7f4j2k8LTwOjiidJuuhD4AqmmdEmhfDPSdrIMGJJPbNaqDVb7OekKpiOpOlrvgsuA\nE5UuoNiUttt7Z75IamuvdfDV0bZUWebOkjYDvlH5UE5s5wFnShqRf+vRkt7fWTCS3iPp+FwbI29j\nHyI1eVVP+znS73BsTmIVXd2eumUwJ4VrSFXXyuu0iLgB+DqpXe9J0tHdEQAR8Qzpqov/Qzop+mXg\nw4UjZfJ0q0httNsB5+XE8PU8r+dIVcGLa8RzI+kI64/ADyLi9934Tj8gVa2fIW0gLVcB5Y3ncFLT\n0nPAV0nV6Ffz+L8CXyKdRFySv/+KynjSeY4bgD9JegG4jbRhrreIWAgcQlo3y0lV8s/Rte3vG6RL\nVO
eTkvCtOeae8q+kncGLwFl0IWlHxC9I55uuIJ2EvQLYKu9EPgi8k/Sdl5FOVNZsysm/4c3A3yOi\nciXSjaSDkfvaWfx1pHNaS/PVMt31S9I2fU3+X6jEdDfpgGEOaZsZn993KCIeIR2kvBARd3YnoIi4\ninQe8FbSQc/NedSr7X6o9bOLI+K2dka3uy3lZc7Ky3qQdCK56POkI/g5pP+f66gvST5HOlicn7ex\n/yHVYn5UY9ojSefxni5cgfSFrm5P3aW2ich6mqRxpJO4G0REXW2PPbjs3wC3R8T/rTFua9IJ4R0i\n4snejMsag6SLgfsj4js9NL+3ki7+GB7ecZVmMNcUGo6kvZTuixiSm34mk9otK+M/mptuNiMd2d7h\nhGBlkPRPpJr3+es5n49L2jA3l/5f4NdOCOVyUhhcKu3YL5Cuhz4+Iop3BR9GOsm2mHS1xdRej9AG\nPUnfI90zc3pELOls+k6cQmpyfIi0XX92PednnXDzkZmZtXBNwczMWgy4m9dGjBgR48aN6+swzMwG\nlLvuumt5RIzsbLoBlxTGjRvHnDmdXhFnZmYFkqp7bKjJzUdmZtbCScHMzFo4KZiZWQsnBTMza+Gk\nYGZmLZwUzMz6ueZmGDcOhgxJf5ubO/tE9w24S1LNzBpJczNMmwYrV6bhxx9PwwBTS+ioxjUFM7N+\nJAJWrIC//Q1uvRX+9V9bE0LFypUwY0Y5y3dNwcysZK+8AsuWwdKl9b1Wrep8nk880fk03eGkYGbW\nRa+9Bs88U/9O/oUXas9n441hu+1g221h++1h993T++LruOPgyRod3I8Zs25ZT3BSMLOGFwHPP9/x\njr14pL98efpMtaFDYeTI1h36Xnu1vi+WV16bbgrq5Eng3/9+23MKAJtsAjNn9uw6qHBSMLNB6ZVX\nau/Qu9pks/XWrTv0XXaBffddd+deeW29dbpCqCdVTibPmJGajMaMSQmhjJPM4KRgZgNEbzbZVF4j\nRsCGG/bu96xl6tTykkA1JwUz6xP1NNkUX8880/Umm1rNNvU02TSyUpOCpMnAmcBQ4NyIOKNq/NbA\necAbgVdIj4+8r8yYzKw8xSab9trju9pks+uusN9+vdtk08hKSwqShgJnAe8nPRN4tqSrq54Z/FXg\nnoj4mKRd8/QHlBWTmXXNmjXpCL3eyykHU5NNoyqzpjAJWBARCwEkXQpMAYpJYQJwBkBEPChpnKTt\nIuLpEuMya1husrHOlJkUdgQWFYYXA3tVTXMv8HHgZkmTgLHAKKBNUpA0DZgGMKasi3PNBqiXX67v\nSL4yTUdNNpUduptsGldfn2g+AzhT0j3APOCvwGvVE0XELGAWQFNTU43jFrO+1dzcc5cMVpps6m2X\nr6fJZocdYI893GRjnSszKSwBRheGR+WyFhHxPPBJAEkCHgUWlhiTWY/rrMOySl829bbLd7fJprrZ\nxk021h2KWltfT8xYGgY8TDpxvASYDRwVEfML02wFrIyIVZI+BewbEcd2NN+mpqaYM2dOKTGbdVUE\njB4NS5asO26DDdLOeelSWL269ueLTTbtHcW7ycZ6gqS7IqKps+lKqylExBpJJwPXky5JPS8i5kua\nnsefA+wGXCgpgPnACWXFY7a+XnwR7rsP5s2DuXPT33nz4Nlna0+/ejUceKCbbGxgKa2mUBbXFKxs\nr70GCxa03fHPnQsLCw2bm20Gb3lLel1+OTz33LrzGTsWHnus18I261Cf1xTMBoKlS1t3/pW/8+en\nm7AgNdfsvDM0NcEnPwkTJ6ZEMHZsa1POfvv1bodlZmVyUrCG8PLLcP/96yaApUtbp3n969MO/6ST\n0t+JE2G33dJVPB3p7Q7LzMrk5iMbVNauhUcfbbvjnzs3NQetXZumGT4c3vzm1uafytH/yJF9G7tZ\nmdx8ZIPeM8+0bfOfNy+dCH7ppTRegje+Me3wjzyyNQG84Q3p8k4z
W5eTgvV7r74KDz647onfv/+9\ndZpttkk7/BNOaD3yf9Ob0rX6ZlY/JwXrNyJSm3z10f9DD6W7fCFdwjlhAhxwQOvOf+LEdD7AN2qZ\nrT8nBesTK1akpp5iu/9996XyirFj0w5/ypTWBLDTTummMDMrh5OClWr1anj44XVP/D7xROs0W26Z\ndvhTp7Ye+b/5zbDFFn0Xt1mjclKwHhEBTz657iWfDzzQ2ivnsGGp9813vQs+85nWq39Gj3bTj1l/\n4aRg6+isx88XX0w3eFUf/Re7e9hxx7TD/8AHWo/+d9kFNtqo97+PmdXPScHaqNXj5/HHw69+lWoD\n8+bBI4+0Tr/ppmmnf8ghre3+b3kLvO51fRO/ma0fJwVr46tfbdtdA6Tmn6uuSkf6e+4Jn/hEawIY\nN849d5oNJk4KBqQawQUXtD0BXCSlewXMbHBzUmhgL78MV14J558Pf/pTKtt449bO4Ir8FFSzxuCK\nf4OJgNtvh09/Ot3wdfTRqUvo005LfQade27q4bPIPX6aNQ7XFBrEU0/BL36RagUPPJB29IcemrqD\n3m+/1vMCY8emv+7x06wxOSkMYqtWwe9+B+edB9demx4e8853ptrAYYe1f3PY1KlOAmaNyklhEJo7\nN9UILroIli+HHXaAL30JjjsuXUFkZtaeUpOCpMnAmaRnNJ8bEWdUjd8SuAgYk2P5QUScX2ZMg9Wz\nz8LFF6dkcPfdqeO4j340NQ8deGC6m9jMrDOl7SokDQXOAt4PLAZmS7o6Iu4vTHYScH9EfETSSOAh\nSc0RsaqsuAaT116DP/whJYJf/zo1F731rfDjH8NRR6XupM3MuqLM48dJwIKIWAgg6VJgClBMCgFs\nLknAZsCzwJoSYxoU/va3lAh+/nNYsiTt/KdPT7WCPfbo6+jMbCArMynsCCwqDC8G9qqa5r+Aq4G/\nA5sDh0fE2uoZSZoGTAMY06AXzL/wAlx+eUoGt9ySrhY66CA480z48Ifdp5CZ9Yy+bmn+AHAP8F7g\njcAfJN0cEc8XJ4qIWcAsSM9o7vUo+0gE3HxzunroiivSYyZ32QW++1045hjYfvu+jtDMBpsyb15b\nAowuDI/KZUWfBK6MZAHwKLBriTH1K83NrX0HjRuXhgEWLYLvfCc9UGb//dNdx0cdBbfdlu4x+PKX\nnRDMrBxl1hRmAztJGk9KBkcAR1VN8wRwAHCzpO2AXYCFJcbUb7TXG+kZZ6RuqSPgPe9Jdxp//OPr\n3mVsZlaG0pJCRKyRdDJwPemS1PMiYr6k6Xn8OcC3gQskzQMEfCUilpcVU38yY0bt3kgfeAC+8Y3U\nE+n48X0Tm5k1LkUMrCb6pqammDNnTl+Hsd6GDEm1gWoSrF3nVLuZ2fqRdFdENHU2nTvE6wOrVsHm\nm9ce16AXV5lZP+Gk0MsWLoR994Xnn1/3LmP3Rmpmfc1JoRddemm64/jhh9MlphdckHolldLfWbPc\nEZ2Z9a2+vk+hIbz0Enzuc/Czn6VeSi++uLWLaicBM+tPXFMo2dy50NSUbkCbMQNuvLE1IZiZ9Teu\nKZQkAs4+G77wBdh669Rx3QEH9HVUZmYdc02hBM8+C4ccAiedBO99L9x7rxOCmQ0MTgo97JZbUk+l\nv/0t/PCH6e+22/Z1VGZm9XFS6CGvvZb6K9p///SAm9tuS01HQ7yGzWwA8TmFHrBkCRx9NPz5z6nj\nurPPbv/5x2Zm/ZmPY7uoumfTL34Rdt8d7ryz9bnITghmNlC5ptAFtXo2/eEPYfRouPXW9KwDM7OB\nzDWFLqjVs2mFE4KZDQZOCl3wxBO1yxcv7t04zMzK4qTQBe31YOqeTc1ssHBS6IKDDlq3zD2bmtlg\n4qRQp3vuSb2a7rZbqhm4Z1MzG4xKvfpI0mTgTNLjOM+NiDOqxn8JqOxShwG7ASMj4tky4+qq555L\n3VZssw387//Cdtv1dURmZuUo
raYgaShwFnAQMAE4UtKE4jQR8f2I2CMi9gD+DbixvyWEtWvTjWmL\nFsHllzshmNngVmbz0SRgQUQsjIhVwKXAlA6mPxK4pMR4uuXb34ZrroEf/Qje8Y6+jsbMrFxlJoUd\ngUWF4cW5bB2SNgEmA79qZ/w0SXMkzVm2bFmPB9qea66Bb30Ljj0WPvOZXlusmVmf6S8nmj8C3Npe\n01FEzIqIpohoGjlyZK8EtHBhOoE8cWLqy0jqlcWamfWpMpPCEmB0YXhULqvlCPpB01GxX6Ndd4VX\nX4Urr0yXnZqZNYIyk8JsYCdJ4yVtSNrxX109kaQtgf2B35QYS6cq/Ro9/nh6atrq1ekk81/+0pdR\nmZn1rtKSQkSsAU4GrgceAC6LiPmSpkuaXpj0Y8DvI+KlsmKpR61+jV59NZWbmTUKRURfx9AlTU1N\nMWfOnB6f75AhqYZQTUo1BjOzgUzSXRHR1Nl0/eVEc59zv0ZmZk4KLWbOXPfRme7XyMwaTd1JQdJw\nSYP2qQG77Zaaibbe2v0amVnjqqvvI0kfAX4AbAiMl7QHcHpEfLTM4HrTT38Kw4fDI4+kxGBm1ojq\nrSmcRuq24h8AEXEPML6kmHrdCy/AxRfD4Yc7IZhZY6s3KayOiBVVZQPrsqUONDfDiy/C9OmdT2tm\nNpjV23X2fElHAUMl7QR8FritvLB6TwSccw7ssQdMmtTX0ZiZ9a16awqnAG8CXgUuBlYAny8rqN50\n551w773w6U+7fyMzs7qSQkSsjIgZEfH2/PpaRLxSdnBlqvRztPfeKRlssEFfR2Rm1vfqSgqS/iBp\nq8Lw1pKuLy+schX7OYLUhPTZz6ZyM7NGVm/z0YiI+EdlICKeA7YtJ6Ty1ernaOVK93NkZlZvUlgr\nqaXDB0ljGcBXHz3xRNfKzcwaRb1XH80AbpF0IyBgX2BaaVGVbMyY1qaj6nIzs0ZW74nm64A9gV+S\nnrX8togYsOcUZs6EjTduW+Z+jszMutYh3kbAs8DzwARJ+5UTUvmmToXjjkvv3c+RmVmrevs++i5w\nODAfqDxdIICbSoqrdMOGwaabwooVMHRoX0djZtY/1HtO4WBgl4h4tcxgetMdd0BTkxOCmVlRvc1H\nC4FBc3vXK6/APffAXnv1dSRmZv1LvTWFlcA9kv5I6uoCgIj4bEcfkjQZOBMYCpwbEWfUmObdwI9I\nSWd5ROxfZ0zd9te/wurV6W5mMzNrVW9SuDq/6iZpKHAW8H5gMTBb0tURcX9hmq2AnwCTI+IJSaXf\nENfcDKeckt6fckq6ac0nmM3MkrqSQkRc2I15TwIWRMRCAEmXAlOA+wvTHAVcGRFP5OUs7cZy6lbp\n3qJyN/OSJWkYnBjMzKD+vo92knSFpPslLay8OvnYjsCiwvDiXFa0M7C1pD9LukvSse0sf5qkOZLm\nLFu2rJ6Qa3L3FmZmHav3RPP5wNnAGuA9wM+Bi3pg+cOAtwEfAj4AfF3SztUTRcSsiGiKiKaRI0d2\ne2Hu3sLMrGP1JoXhEfFHQBHxeEScRtqRd2QJMLowPCqXFS0Gro+IlyJiOem+h93rjKnL2uvGwt1b\nmJkl9SaFVyUNAf4m6WRJHwM26+Qzs4GdJI2XtCFwBOuerP4NsI+kYZI2AfYCHuhC/F0ycyZstFHb\nMndvYWbWqt6k8DlgE9JjON8GHAN8oqMPRMQa4GTgetKO/rKImC9puqTpeZoHgOuAucCdpMtW7+vO\nF6nH1Klw/PHpvbu3MDNbV71XH83Ob18EPlnvzCPiGuCaqrJzqoa/D3y/3nmur7Fj098VK2DzzXtr\nqWZmA0O9fR81kbrPHlv8TERMLCmu0ixeDFtu6YRgZlZLvTevNQNfAubR2iHegLR4MYwa1ddRmJn1\nT/UmhWUR0aU7mvsrJwUzs/bVmxS+KelcoLrvoytLiaokzc1w992wdi2MG5euOvJJZjOzVvUmhU
8C\nu5I6rSs+T2HAJIVKFxdrc/SPP+4uLszMqikiOp9IeigidumFeDrV1NQUc+bM6fLnxo2r/VzmsWPh\nscfWOywzs35N0l0R0dTZdPXep3CbpAnrGVOfchcXZmadq7f5aG/S8xQeJZ1TEBAD6ZLUMWNq1xTc\nxYWZWat6k8LkUqPoBTNnwgknwKuFB4q6iwszs7Y6bT7KD8u5PneE1+bVC/H1mKlT4aST0nt3cWFm\nVlunNYWIeE3SQ5LGVB6GM1BNmpT+3ncfTBjQZ0jMzMpRb/PR1sB8SXcCL1UKI+KjpURVkpdfTn83\n2aRv4zAz66/qTQpfLzWKXlJ56pqTgplZbfX2knqjpO2At+eiO8t+nnIZnBTMzDpW7zOa/5n0vIPD\ngH8G7pB0aJmBlaHSfDR8eN/GYWbWX9XbfDQDeHuldiBpJHADcEVZgZVh5UrYcEMYOrSvIzEz65/q\nvaN5SFVz0TNd+Gy/sXKlm47MzDpS7479OknXSzpO0nHA76h6olotkibny1kXSDq1xvh3S1oh6Z78\n+kbXwu8aJwUzs4512HwkaaOIeDUiviTp48A+edSsiLiqk88OBc4C3g8sBmZLujoi7q+a9OaI+HA3\n4++Sl192UjAz60hnNYW/AEj6RURcGRFfyK8OE0I2CVgQEQsjYhVwKTBlPePttuZmuPJKWLAg9Zja\n3NxXkZiZ9V+dnWjeUNJRwDtzTaGNTh6ysyOwqDC8GNirxnTvlDQXWAJ8MSLmV08gaRowDWBMN3qw\nqzxLoXL1kZ+lYGZWW2c1henAvsBWwEeqXj3R5HM3MCb3tvqfwK9rTRQRsyKiKSKaRo4c2eWFzJjR\neo9CxcqVqdzMzFp1WFOIiFsk3QYsjoiu9ie6BBhdGB6Vy4rzf77w/hpJP5E0IiKWd3FZHfKzFMzM\n6tPp1UcRsRbozo1qs4GdJI2XtCFwBHB1cQJJr5ek/H5SjueZbiyrQ+21OPlZCmZmbdV7SeofJR1S\n2YHXIyLWACcD1wMPAJdFxHxJ0yVNz5MdCtwn6V7gx8ARUc/zQbto5sx1rzrysxTMzNZV7zOaXwA2\nBV4DXqb1yWtblBveurr7jObmZjjuOFizJj1LYeZMn2Q2s8ZR7zOa6+0Qb/P1D6lvTZ0Kp58Oe+4J\nl1zS19GYmfVP9XaIJ0lHS/p6Hh6dzwEMKKtXwwYb9HUUZmb9V73nFH4CvAM4Kg+/SLpbeUBZvRqG\n1dsFoJlZA6p3F7lXROwp6a8AEfFcvqJoQFmzxjUFM7OO1FtTWJ37Mgpo6Tp7bWlRlcTNR2ZmHas3\nKfwYuAq0fm5zAAAODElEQVTYVtJM4Bbg30uLqiRuPjIz61i9Vx81S7oLOIB0OerBEfFAqZGVwM1H\nZmYd66zr7I1J/R/9EzAP+Gm+KW1Ack3BzKxjnTUfXQg0kRLCQcAPSo+oJBE+p2Bm1pnOksKEiDg6\nIn5K6pJiv16IqRQXXZT+fvvbfp6CmVl7OksKqytvBnKzUXMzTJ/eOlx5noITg5lZW50lhd0lPZ9f\nLwATK+8lPd/JZ/sNP0/BzKw+nT1PYWhvBVImP0/BzKw+9d6nMKD5eQpmZvVpiKQwcyYMH962zM9T\nMDNbV0MkhalT4QeFi2nHjoVZs/w8BTOzag2RFAAOPjj9/elP4bHHnBDMzGopNSlImizpIUkLJJ3a\nwXRvl7RGUneeBV2X115Lf4c0TBo0M+u60naRuVfVs0h3Qk8AjpQ0oZ3pvgv8vqxYANbmPl2HDorr\nqczMylHmcfMkYEFELIyIVcClwJQa050C/ApYWmIsrimYmdWhzF3kjsCiwvDiXNZC0o7Ax4CzO5qR\npGmS5kias2zZsm4F45qCmVnn+vq4+UfAVyKiwwf2RMSsiGiKiKaRI0d2a0GuKZiZda7MjqSXAKML\nw6NyWVETcKkkgBHAByWtiYhf93QwrimYmXWuzKQwG9hJ0n
hSMjgCOKo4QUSMr7yXdAHw2zISArim\nYGZWj9J2kblX1ZOB64EHgMsiYr6k6ZKmd/zpnvc//5P+Hn64u842M2uPIqKvY+iSpqammDNnTpc+\n09wMJ54Ir7zSWrbJJr6r2cwah6S7IqKps+kaojFlxoy2CQHcdbaZWS0NkRTcdbaZWX0aIim462wz\ns/o0RFKYORM23rhtmbvONjNbV0MkhalT4StfSe8ld51tZtaehkgKAAcemP5ee627zjYza0/DJIXK\nlbfp5mkzM6vFScHMzFo4KZiZWQsnBTMza+GkYGZmLZwUzMyshZOCmZm1cFIwM7MWTgpmZtbCScHM\nzFo4KZiZWYuGSArNzXD00en9oYf6UZxmZu0pNSlImizpIUkLJJ1aY/wUSXMl3SNpjqR9ejqG5maY\nNg2WLk3DTz+dhp0YzMzWVdozmiUNBR4G3g8sBmYDR0bE/YVpNgNeioiQNBG4LCJ27Wi+XX1G87hx\n8Pjj65aPHZt6SzUzawT94RnNk4AFEbEwIlYBlwJTihNExIvRmpU2BXo8Q/lRnGZm9SszKewILCoM\nL85lbUj6mKQHgd8Bx9eakaRpuXlpzrJly7oUhB/FaWZWvz4/0RwRV+Umo4OBb7czzayIaIqIppEj\nR3Zp/jNnpkdvFvlRnGZmtZWZFJYAowvDo3JZTRFxE/AGSSN6MoipU9OjNyu55PWv96M4zczaM6zE\nec8GdpI0npQMjgCOKk4g6Z+AR/KJ5j2BjYBnejqQqVNh663hQx+C3/wGJk3q6SWYmQ0OpSWFiFgj\n6WTgemAocF5EzJc0PY8/BzgEOFbSauBl4PAo6XKoki6yMjMbVMqsKRAR1wDXVJWdU3j/XeC7ZcZQ\nzXc0m5m1r89PNPcW1xTMzDrXMEmhwjUFM7P2NUxScE3BzKxzDZMUKlxTMDNrX8MkBdcUzMw61zBJ\nocI1BTOz9jVMUnBNwcyscw2RFJqb4VOfSu8//GE/S8HMrD2l3rzWH1QesrNyZRp+8sk0DO7/yMys\n2qCvKcyY0ZoQKlauTOVmZtbWoE8KfsiOmVn9Bn1S8EN2zMzqN+iTgh+yY2ZWv0GfFCoP2RmRH92z\n/fZ+yI6ZWXsG/dVHkBLA8OFwyCFw3XUwcWJfR2Rm1j8N+pqCmZnVr2GSgu9oNjPrXKlJQdJkSQ9J\nWiDp1Brjp0qaK2mepNsk7V5mPGmZZS/BzGzgKi0pSBoKnAUcBEwAjpQ0oWqyR4H9I+ItwLeBWWXF\n45qCmVnnyqwpTAIWRMTCiFgFXApMKU4QEbdFxHN58HZgVInxAK4pmJl1pMyksCOwqDC8OJe15wTg\n2lojJE2TNEfSnGXLlvVgiGZmVtQvTjRLeg8pKXyl1viImBURTRHRNHLkyC7Pv7kZPvOZ9P7AA91L\nqplZe8q8T2EJMLowPCqXtSFpInAucFBEPNPTQbiXVDOz+pVZU5gN7CRpvKQNgSOAq4sTSBoDXAkc\nExEPlxGEe0k1M6tfaTWFiFgj6WTgemAocF5EzJc0PY8/B/gGsA3wE6UzwGsioqkn43AvqWZm9Su1\nm4uIuAa4pqrsnML7E4ETy4xhzBh4/PHa5WZm1la/ONFcJveSamZWv0GfFCq9pI4dm+5RGDvWvaSa\nmbWnYXpJdRIwM+vcoK8pmJlZ/ZwUzMyshZOCmZm1cFIwM7MWTgpmZtZCMcAeNCBpGVDjdrS6jACW\n92A4vWmgxj5Q44aBG/tAjRsGbuwDIe6xEdFpj6IDLimsD0lzerobjd4yUGMfqHHDwI19oMYNAzf2\ngRp3LW4+MjOzFk4KZmbWotGSQmnPgO4FAzX2gRo3DNzYB2rcMHBjH6hxr6OhzimYmVnHGq2mYGZm\nHXBSMDOzFg2TFCRNlvSQpAWSTu0H8YyW9L+S7pc0X9LncvlpkpZIuie/Plj4zL/l+B+S9IFC+dsk\nzcvjfqz8GLsSY38sL+
8eSXNy2esk/UHS3/Lfrfth3LsU1us9kp6X9Pn+uM4lnSdpqaT7CmU9to4l\nbSTpl7n8DknjSo79+5IelDRX0lWStsrl4yS9XFj35xQ+06uxtxN3j20bZa7zHhURg/5FehzoI8Ab\ngA2Be4EJfRzT9sCe+f3mwMPABOA04Is1pp+Q494IGJ+/z9A87k5gb0DAtcBBJcf+GDCiqux7wKn5\n/anAd/tb3DW2iaeAsf1xnQP7AXsC95WxjoF/Ac7J748Aflly7AcCw/L77xZiH1ecrmo+vRp7O3H3\n2LZR5jrvyVej1BQmAQsiYmFErAIuBab0ZUAR8WRE3J3fvwA8AOzYwUemAJdGxKsR8SiwAJgkaXtg\ni4i4PdLW9nPg4JLDby++C/P7Cwsx9Ne4DwAeiYiO7o7vs9gj4ibg2Rrx9NQ6Ls7rCuCAnqrt1Io9\nIn4fEWvy4O3AqI7m0Rext7PO29Ov1nlPapSksCOwqDC8mI53wL0qVyPfCtyRi07J1ezzCk0E7X2H\nHfP76vIyBXCDpLskTctl20XEk/n9U8B2+X1/irvoCOCSwnB/X+fQs+u45TN5Z70C2KacsNdxPOkI\numJ8bpq5UdK+hfj6S+w9tW305TqvW6MkhX5L0mbAr4DPR8TzwNmkZq49gCeBH/ZheO3ZJyL2AA4C\nTpK0X3FkPkLqt9c6S9oQ+ChweS4aCOu8jf6+jtsjaQawBmjORU8CY/L29AXgYklb9FV8NQy4bWN9\nNUpSWAKMLgyPymV9StIGpITQHBFXAkTE0xHxWkSsBf6b1PQF7X+HJbStipf+3SJiSf67FLgqx/h0\nrjpXqv5L+1vcBQcBd0fE0zAw1nnWk+u45TOShgFbAs+UFnlaznHAh4GpOamRm1+eye/vIrXN79xf\nYu/hbaPX13l3NEpSmA3sJGl8Pko8Ari6LwPKbYk/Ax6IiP9XKN++MNnHgMqVEFcDR+QrGMYDOwF3\n5uaE5yXtned5LPCbEuPeVNLmlfekE4j35fg+kSf7RCGGfhF3lSMpNB3193Ve0JPruDivQ4E/VXbU\nZZA0Gfgy8NGIWFkoHylpaH7/hhz7wv4Sew9vG726zrutr89099YL+CDpCp9HgBn9IJ59SNX/ucA9\n+fVB4BfAvFx+NbB94TMzcvwPUbjaBWgibayPAP9FvlO9pLjfQLrq4l5gfmVdktpG/wj8DbgBeF1/\niruwzE1JR2dbFsr63TonJa0ngdWkdukTenIdAxuTms8WkK6WeUPJsS8gtadXtvXKVTiH5O3oHuBu\n4CN9FXs7cffYtlHmOu/Jl7u5MDOzFo3SfGRmZnVwUjAzsxZOCmZm1sJJwczMWjgpmJlZCycFawiS\nQtJFheFhkpZJ+m0X5/OYpBHdmUbS8bn3zLmS7pM0JZefLul9XYnDrCzD+joAs17yEvBmScMj4mXg\n/fTiXe2SRpGua98zIlbk7k1GAkTEN3orDrPOuKZgjeQa4EP5ffVdza+T9Ot8FH+7pIm5fBtJv1d6\n5sW5pO6QK585WtKduTO3n1buzG3HtsALwIsAEfFipN41kXSBpEMlNam13/55kiKPf6Ok63IHhDdL\n2rUH14lZG04K1kguJXVNsDEwkdZeaQG+Bfw1IiYCXyV1eQzwTeCWiHgTqZ+nMQCSdgMOB94VqTO3\n14CpHSz7XuBp4FFJ50v6SPUEETEnIvbI87sO+EEeNQs4JSLeBnwR+EnXv7pZfdx8ZA0jIubmbsqP\nJNUaivYhdblARPwp1xC2ID145eO5/HeSnsvTHwC8DZidurhhOK0d1NVa9mu5/5+358/+h6S3RcRp\n1dNKOpz0sJcDczPTO4HL1dr1/kZd++Zm9XNSsEZzNekI/N2sX1/2Ai6MiH+r9wOR+pS5E7hT0h+A\n80lP9mqdqfTmXLZfTiRDgH/k2oNZ6dx8ZI3mPOBbETGvqvxmcvOPpHcDyyM93+Im4Khc
fhBQecjK\nH4FDJW2bx71O0tj2FippB0l7For2AB6vmmYr0nmOYyNiGUCO4VFJh+VpJGn3Ln9rszq5pmANJSIW\nAz+uMeo04DxJc4GVtHZx/C3gEknzgduAJ/J87pf0NeD3+Wh+NXASVTv6gg2AH0jaAXgFWAZMr5pm\nCumZ0f9daSrKNYSpwNl5eRuQzo3c27VvblYf95JqZmYt3HxkZmYtnBTMzKyFk4KZmbVwUjAzsxZO\nCmZm1sJJwczMWjgpmJlZi/8PJWbqFjVS1C0AAAAASUVORK5CYII=\n",
      "text/plain": [
       "<matplotlib.figure.Figure at 0x1ec72fb9518>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "display()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 5.5 N-gram标注"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 1 一元标注"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 197,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Load the 'news' category of the Brown corpus in the two forms used below.\n",
    "from nltk.corpus import brown\n",
    "\n",
    "# Untagged sentences (tagger input) and tagged sentences (training / scoring).\n",
    "brown_sents = brown.sents(categories='news')\n",
    "brown_tagged_sents = brown.tagged_sents(categories='news')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 200,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "unigram_tagger = nltk.UnigramTagger(brown_tagged_sents)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 201,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('Various', 'JJ'),\n",
       " ('of', 'IN'),\n",
       " ('the', 'AT'),\n",
       " ('apartments', 'NNS'),\n",
       " ('are', 'BER'),\n",
       " ('of', 'IN'),\n",
       " ('the', 'AT'),\n",
       " ('terrace', 'NN'),\n",
       " ('type', 'NN'),\n",
       " (',', ','),\n",
       " ('being', 'BEG'),\n",
       " ('on', 'IN'),\n",
       " ('the', 'AT'),\n",
       " ('ground', 'NN'),\n",
       " ('floor', 'NN'),\n",
       " ('so', 'QL'),\n",
       " ('that', 'CS'),\n",
       " ('entrance', 'NN'),\n",
       " ('is', 'BEZ'),\n",
       " ('direct', 'JJ'),\n",
       " ('.', '.')]"
      ]
     },
     "execution_count": 201,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "unigram_tagger.tag(brown_sents[2007])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 202,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.9349006503968017"
      ]
     },
     "execution_count": 202,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "unigram_tagger.evaluate(brown_tagged_sents)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 2 分离训练和测试数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 210,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "4160\n"
     ]
    }
   ],
   "source": [
    "# Split point for a 90/10 split: the first `size` sentences become training data.\n",
    "# Lowering the training share makes tagging accuracy drop.\n",
    "size = int(0.9 * len(brown_tagged_sents))\n",
    "print(size)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 211,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.8121200039868434"
      ]
     },
     "execution_count": 211,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Train on the first `size` sentences and score on the remaining, unseen ones.\n",
    "train_sents, test_sents = brown_tagged_sents[:size], brown_tagged_sents[size:]\n",
    "unigram_tagger = nltk.UnigramTagger(train=train_sents)\n",
    "unigram_tagger.evaluate(test_sents)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 3 一般的N-gram的标注"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 212,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('Various', 'JJ'),\n",
       " ('of', 'IN'),\n",
       " ('the', 'AT'),\n",
       " ('apartments', 'NNS'),\n",
       " ('are', 'BER'),\n",
       " ('of', 'IN'),\n",
       " ('the', 'AT'),\n",
       " ('terrace', 'NN'),\n",
       " ('type', 'NN'),\n",
       " (',', ','),\n",
       " ('being', 'BEG'),\n",
       " ('on', 'IN'),\n",
       " ('the', 'AT'),\n",
       " ('ground', 'NN'),\n",
       " ('floor', 'NN'),\n",
       " ('so', 'CS'),\n",
       " ('that', 'CS'),\n",
       " ('entrance', 'NN'),\n",
       " ('is', 'BEZ'),\n",
       " ('direct', 'JJ'),\n",
       " ('.', '.')]"
      ]
     },
     "execution_count": 212,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Sentence 2007 lies inside the training slice (2007 < size), so this shows the\n",
    "# bigram tagger on a sentence it was trained on.\n",
    "bigram_tagger = nltk.BigramTagger(train=train_sents)\n",
    "bigram_tagger.tag(brown_sents[2007])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 214,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "unseen_sent = brown_sents[4203]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 215,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('The', 'AT'),\n",
       " ('population', 'NN'),\n",
       " ('of', 'IN'),\n",
       " ('the', 'AT'),\n",
       " ('Congo', 'NP'),\n",
       " ('is', 'BEZ'),\n",
       " ('13.5', None),\n",
       " ('million', None),\n",
       " (',', None),\n",
       " ('divided', None),\n",
       " ('into', None),\n",
       " ('at', None),\n",
       " ('least', None),\n",
       " ('seven', None),\n",
       " ('major', None),\n",
       " ('``', None),\n",
       " ('culture', None),\n",
       " ('clusters', None),\n",
       " (\"''\", None),\n",
       " ('and', None),\n",
       " ('innumerable', None),\n",
       " ('tribes', None),\n",
       " ('speaking', None),\n",
       " ('400', None),\n",
       " ('separate', None),\n",
       " ('dialects', None),\n",
       " ('.', None)]"
      ]
     },
     "execution_count": 215,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "bigram_tagger.tag(unseen_sent)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 213,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.10206319146815508"
      ]
     },
     "execution_count": 213,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "bigram_tagger.evaluate(test_sents)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 220,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.062095086215488884"
      ]
     },
     "execution_count": 220,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Same bigram model, but with cutoff=2 (see the NLTK NgramTagger docs: contexts\n",
    "# whose most likely tag was seen too rarely are left out of the model).\n",
    "bigram_tagger_cut = nltk.BigramTagger(train=train_sents, cutoff=2)\n",
    "bigram_tagger_cut.evaluate(test_sents)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 216,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.0626931127279976"
      ]
     },
     "execution_count": 216,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Trigram tagger without any backoff, scored on the same held-out sentences.\n",
    "trigram_tagger = nltk.TrigramTagger(train=train_sents)\n",
    "trigram_tagger.evaluate(test_sents)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 4 组合标注器"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 217,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Backoff chain: trigram -> bigram -> unigram -> constant default tag 'NN'.\n",
    "# Each tagger is given the next, less specific one as its `backoff`.\n",
    "t0 = nltk.DefaultTagger('NN')\n",
    "t1 = nltk.UnigramTagger(train=train_sents, backoff=t0)\n",
    "t2 = nltk.BigramTagger(train=train_sents, backoff=t1)\n",
    "t3 = nltk.TrigramTagger(train=train_sents, backoff=t2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 221,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.8452108043456593"
      ]
     },
     "execution_count": 221,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "t2.evaluate(test_sents)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 5 标注生词"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "> 一个有用的基于上下文标注生词的方法是：把标注器的词汇表限制为最频繁的 n 个词，并使用 5.3 节中的方法将其余每个词都替换为一个特殊的词 UNK。训练时，unigram 标注器可能会学到 UNK 通常是一个名词。然而，n-gram 标注器会检测出 UNK 带有其他标记的上下文。例如：如果前面的词是 to（标注为 TO），那么 UNK 可能会被标注为一个动词。"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 6 存储标注器"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 223,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "import pickle"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 7 性能限制（略）"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 229,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Condition = (tag of word i-2, tag of word i-1, word i); sample = tag of word i.\n",
    "cfd = nltk.ConditionalFreqDist(\n",
    "    ((prev2[1], prev1[1], cur[0]), cur[1])\n",
    "    for sent in brown_tagged_sents\n",
    "    for prev2, prev1, cur in nltk.trigrams(sent)\n",
    ")\n",
    "# Keep the contexts that were observed with more than one distinct tag.\n",
    "ambiguous_contexts = [ctx for ctx in cfd.conditions() if len(cfd[ctx]) > 1]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 230,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.049297702068029296"
      ]
     },
     "execution_count": 230,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "sum(cfd[c].N() for c in ambiguous_contexts) / cfd.N()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 8 跨句子边界标注（同4）"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 5.6 基于转换的标注"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 236,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "from nltk.tbl.template import Template\n",
    "from nltk.tag.brill import Pos, Word\n",
    "from nltk.tag import untag, RegexpTagger, BrillTaggerTrainer\n",
    "from nltk.corpus import treebank"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 237,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Three consecutive 100-sentence slices of the tagged Penn Treebank sample:\n",
    "# [0:100] for training, [100:200] as baseline data, [200:300] as gold standard.\n",
    "training_data, baseline_data, gold_data = (\n",
    "    treebank.tagged_sents()[start:start + 100] for start in (0, 100, 200)\n",
    ")\n",
    "# The gold sentences with their tags removed via untag().\n",
    "testing_data = list(map(untag, gold_data))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 238,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "# Suffix-based (regex, tag) rules for the baseline RegexpTagger. Order matters:\n",
    "# more specific suffixes come first and the catch-all NN rule comes last.\n",
    "patterns = [\n",
    "    (r'.*ing$', 'VBG'),               # gerunds\n",
    "    (r'.*ed$', 'VBD'),                # simple past\n",
    "    (r'.*es$', 'VBZ'),                # 3rd singular present\n",
    "    (r'.*ould$', 'MD'),               # modals\n",
    "    (r'.*\\'s$', 'NN$'),               # possessive nouns\n",
    "    (r'.*s$', 'NNS'),                 # plural nouns\n",
    "    (r'^-?[0-9]+(.[0-9]+)?$', 'CD'),  # cardinal numbers\n",
    "    (r'.*', 'NN')                     # nouns (default)\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 239,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "backoff = RegexpTagger(patterns)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 240,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.2205942205942206"
      ]
     },
     "execution_count": 240,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "baseline = backoff\n",
    "baseline.evaluate(gold_data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 241,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "Template._cleartemplates()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 242,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "templates = [Template(Pos([-1])), Template(Pos([-1]), Word([0]))]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 243,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "tt = BrillTaggerTrainer(baseline, templates, trace=3)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 244,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "TBL train (fast) (seqs: 100; tokens: 2417; tpls: 2; min score: 2; min acc: None)\n",
      "Finding initial useful rules...\n",
      "    Found 876 useful rules.\n",
      "\n",
      "           B      |\n",
      "   S   F   r   O  |        Score = Fixed - Broken\n",
      "   c   i   o   t  |  R     Fixed = num tags changed incorrect -> correct\n",
      "   o   x   k   h  |  u     Broken = num tags changed correct -> incorrect\n",
      "   r   e   e   e  |  l     Other = num tags changed incorrect -> incorrect\n",
      "   e   d   n   r  |  e\n",
      "------------------+-------------------------------------------------------\n",
      "  93  93   0   0  | NN->DT if Pos:NN@[-1] & Word:the@[0]\n",
      "  88  88   0   0  | NN->, if Pos:NN@[-1] & Word:,@[0]\n",
      "  69  69   0   0  | NN->. if Pos:NN@[-1] & Word:.@[0]\n",
      "  51  51   0   0  | NN->IN if Pos:NN@[-1] & Word:of@[0]\n",
      "  38  38   0   0  | NN->TO if Pos:NN@[-1] & Word:to@[0]\n",
      "  34  46  12 130  | NN->IN if Pos:NNS@[-1]\n",
      "  30  33   3   1  | VBZ->NNS if Pos:NN@[-1]\n",
      "  27  27   0   0  | NN->DT if Pos:NN@[-1] & Word:a@[0]\n",
      "  22  27   5  39  | NN->-NONE- if Pos:VBD@[-1]\n",
      "  19  19   0  10  | NN->VB if Pos:TO@[-1]\n"
     ]
    }
   ],
   "source": [
    "tagger1 = tt.train(training_data, max_rules=10)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 246,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.39845339845339844"
      ]
     },
     "execution_count": 246,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tagger1.evaluate(gold_data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 249,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "TBL train (fast) (seqs: 100; tokens: 2417; tpls: 2; min score: 2; min acc: 0.99)\n",
      "Finding initial useful rules...\n",
      "    Found 876 useful rules.\n",
      "\n",
      "           B      |\n",
      "   S   F   r   O  |        Score = Fixed - Broken\n",
      "   c   i   o   t  |  R     Fixed = num tags changed incorrect -> correct\n",
      "   o   x   k   h  |  u     Broken = num tags changed correct -> incorrect\n",
      "   r   e   e   e  |  l     Other = num tags changed incorrect -> incorrect\n",
      "   e   d   n   r  |  e\n",
      "------------------+-------------------------------------------------------\n",
      "  93  93   0   0  | NN->DT if Pos:NN@[-1] & Word:the@[0]\n",
      "  88  88   0   0  | NN->, if Pos:NN@[-1] & Word:,@[0]\n",
      "  69  69   0   0  | NN->. if Pos:NN@[-1] & Word:.@[0]\n",
      "  51  51   0   0  | NN->IN if Pos:NN@[-1] & Word:of@[0]\n",
      "  38  38   0   0  | NN->TO if Pos:NN@[-1] & Word:to@[0]\n",
      "  30  30   0   0  | NN->DT if Pos:NN@[-1] & Word:a@[0]\n",
      "  19  19   0  10  | NN->VB if Pos:TO@[-1]\n",
      "  19  19   0   0  | NN->. if Pos:NNS@[-1] & Word:.@[0]\n",
      "  19  19   0   0  | NN->CC if Pos:NN@[-1] & Word:and@[0]\n",
      "  18  18   0   0  | CD->-NONE- if Pos:NN@[-1] & Word:0@[0]\n",
      "  17  17   0   3  | NN$->POS if Pos:NN@[-1]\n",
      "  17  17   0   0  | NN->IN if Pos:NN@[-1] & Word:in@[0]\n",
      "  16  16   0   0  | NN->IN if Pos:NN@[-1] & Word:for@[0]\n",
      "  15  15   0   0  | NN->, if Pos:NNS@[-1] & Word:,@[0]\n",
      "  15  15   0   0  | NN->-NONE- if Pos:NN@[-1] & Word:*U*@[0]\n",
      "  14  14   0   0  | NN->VBD if Pos:NN@[-1] & Word:said@[0]\n",
      "  12  12   0   0  | NN->-NONE- if Pos:NN@[-1] & Word:*@[0]\n",
      "  12  12   0   0  | NN->IN if Pos:NNS@[-1] & Word:of@[0]\n",
      "  11  11   0   0  | NN->CC if Pos:NNS@[-1] & Word:and@[0]\n",
      "  10  10   0   0  | NN->, if Pos:VBZ@[-1] & Word:,@[0]\n",
      "  10  10   0   0  | NN->IN if Pos:NN@[-1] & Word:from@[0]\n",
      "  10  10   0   0  | NN->IN if Pos:NN@[-1] & Word:with@[0]\n",
      "   9   9   0   0  | NN->-NONE- if Pos:NN@[-1] & Word:*T*-1@[0]\n",
      "   8   8   0   0  | NN->$ if Pos:NN@[-1] & Word:$@[0]\n",
      "   8   8   0   0  | NN->CD if Pos:CD@[-1] & Word:billion@[0]\n",
      "   8   8   0   0  | NN->IN if Pos:NN@[-1] & Word:on@[0]\n",
      "   8   8   0   0  | NN->IN if Pos:NNS@[-1] & Word:in@[0]\n",
      "   7   7   0  14  | NN->-NONE- if Pos:-NONE-@[-1]\n",
      "   7   7   0   0  | NN->-NONE- if Pos:VBD@[-1] & Word:*@[0]\n",
      "   7   7   0   0  | NN->-NONE- if Pos:VBD@[-1] & Word:*-1@[0]\n",
      "   7   7   0   0  | NN->DT if Pos:VBD@[-1] & Word:a@[0]\n",
      "   7   7   0   0  | NNS->VBZ if Pos:NN@[-1] & Word:is@[0]\n",
      "   6   6   0   0  | VBZ->NNS if Pos:VBD@[-1]\n",
      "   6   6   0   0  | NN->. if Pos:VBZ@[-1] & Word:.@[0]\n",
      "   6   6   0   0  | NN->DT if Pos:VBD@[-1] & Word:the@[0]\n",
      "   6   6   0   0  | NN->IN if Pos:NN@[-1] & Word:than@[0]\n",
      "   6   6   0   0  | VBZ->NNS if Pos:NN@[-1] & Word:rates@[0]\n",
      "   5   5   0   0  | NN->$ if Pos:IN@[-1] & Word:$@[0]\n",
      "   5   5   0   0  | NN->-NONE- if Pos:NN@[-1] & Word:*-1@[0]\n",
      "   5   5   0   0  | NN->CC if Pos:VBZ@[-1] & Word:and@[0]\n",
      "   5   5   0   0  | NN->CD if Pos:CD@[-1] & Word:million@[0]\n",
      "   5   5   0   0  | NN->IN if Pos:NN@[-1] & Word:at@[0]\n",
      "   5   5   0   0  | NN->IN if Pos:NN@[-1] & Word:by@[0]\n",
      "   5   5   0   0  | NN->PRP if Pos:NN@[-1] & Word:it@[0]\n",
      "   5   5   0   0  | NN->VBD if Pos:NNS@[-1] & Word:were@[0]\n",
      "   5   5   0   0  | NNS->VBZ if Pos:NN@[-1] & Word:has@[0]\n",
      "   5   5   0   0  | NN->RB if Pos:VBZ@[-1] & Word:n't@[0]\n",
      "   4   4   0   0  | VBG->NN if Pos:CC@[-1]\n",
      "   4   4   0   0  | NN->: if Pos:NN@[-1] & Word:--@[0]\n",
      "   4   4   0   0  | NN->CC if Pos:NN@[-1] & Word:&@[0]\n",
      "   4   4   0   0  | NN->DT if Pos:,@[-1] & Word:a@[0]\n",
      "   4   4   0   0  | NN->DT if Pos:VBG@[-1] & Word:the@[0]\n",
      "   4   4   0   0  | VBZ->NNS if Pos:DT@[-1]\n",
      "   4   4   0   0  | NN->IN if Pos:NNS@[-1] & Word:at@[0]\n",
      "   4   4   0   0  | NN->IN if Pos:NNS@[-1] & Word:for@[0]\n",
      "   4   4   0   0  | NN->IN if Pos:VBZ@[-1] & Word:for@[0]\n",
      "   4   4   0   0  | NN->NNP if Pos:NN@[-1] & Word:Korea@[0]\n",
      "   4   4   0   0  | NN->NNP if Pos:NN@[-1] & Word:Talcott@[0]\n",
      "   4   4   0   0  | NN->TO if Pos:VBG@[-1] & Word:to@[0]\n",
      "   4   4   0   0  | NN->VBP if Pos:NNS@[-1] & Word:are@[0]\n",
      "   4   4   0   0  | NN->WDT if Pos:,@[-1] & Word:which@[0]\n",
      "   4   4   0   2  | NN->WDT if Pos:NN@[-1] & Word:that@[0]\n",
      "   5   5   0   1  | NN->-NONE- if Pos:WDT@[-1]\n",
      "   4   4   0   0  | NNS->NN if Pos:IN@[-1] & Word:asbestos@[0]\n",
      "   4   4   0   0  | NNS->NN if Pos:NN@[-1] & Word:asbestos@[0]\n",
      "   4   4   0   0  | NNS->VBD if Pos:,@[-1] & Word:was@[0]\n",
      "   4   4   0   1  | VBD->VBN if Pos:VBD@[-1]\n",
      "   4   4   0   0  | NNS->VBD if Pos:NN@[-1] & Word:was@[0]\n",
      "   3   3   0   0  | NN->-NONE- if Pos:VBN@[-1]\n",
      "   3   3   0   0  | VBZ->NNS if Pos:VBG@[-1]\n",
      "   4   4   0   0  | NN->IN if Pos:NNS@[-1] & Word:because@[0]\n",
      "   3   3   0   0  | -NONE-->DT if Pos:-NONE-@[-1] & Word:the@[0]\n",
      "   4   4   0   9  | NN->IN if Pos:-NONE-@[-1]\n",
      "   4   4   0   0  | NNS->DT if Pos:IN@[-1] & Word:this@[0]\n",
      "   3   3   0   0  | NN->'' if Pos:,@[-1] & Word:''@[0]\n",
      "   3   3   0   0  | NN->, if Pos:CD@[-1] & Word:,@[0]\n",
      "   3   3   0   0  | NN->-NONE- if Pos:VBD@[-1] & Word:*T*-1@[0]\n",
      "   3   3   0   0  | NN->. if Pos:CD@[-1] & Word:.@[0]\n",
      "   3   3   0   0  | NN->CC if Pos:NN@[-1] & Word:or@[0]\n",
      "   3   3   0   0  | NN->CD if Pos:CD@[-1] & Word:trillion@[0]\n",
      "   3   3   0   0  | NN->DT if Pos:IN@[-1] & Word:any@[0]\n",
      "   3   3   0   0  | NN->DT if Pos:NN@[-1] & Word:all@[0]\n",
      "   3   3   0   0  | NN->DT if Pos:NN@[-1] & Word:those@[0]\n",
      "   3   3   0   0  | NN->DT if Pos:NNS@[-1] & Word:a@[0]\n",
      "   3   3   0   0  | NN->IN if Pos:NN@[-1] & Word:because@[0]\n",
      "   3   3   0   0  | NN->IN if Pos:NN@[-1] & Word:before@[0]\n",
      "   3   3   0   0  | NN->IN if Pos:NNS@[-1] & Word:ago@[0]\n",
      "   3   3   0   0  | NN->IN if Pos:NNS@[-1] & Word:from@[0]\n",
      "   3   3   0   0  | NN->IN if Pos:NNS@[-1] & Word:like@[0]\n",
      "   3   3   0   0  | NN->IN if Pos:VBD@[-1] & Word:by@[0]\n",
      "   3   3   0   0  | NN->IN if Pos:VBZ@[-1] & Word:in@[0]\n",
      "   3   3   0   0  | NN->JJ if Pos:DT@[-1] & Word:few@[0]\n",
      "   3   3   0   0  | NN->JJ if Pos:NN@[-1] & Word:average@[0]\n",
      "   3   3   0   0  | NN->JJ if Pos:NNS@[-1] & Word:old@[0]\n",
      "   3   3   0   0  | NN->JJR if Pos:NN@[-1] & Word:higher@[0]\n",
      "   3   3   0   0  | NN->JJS if Pos:DT@[-1] & Word:latest@[0]\n",
      "   3   3   0   0  | NN->MD if Pos:NN@[-1] & Word:will@[0]\n",
      "   5   5   0   1  | NN->VB if Pos:MD@[-1]\n",
      "   3   3   0   0  | NN->NNP if Pos:DT@[-1] & Word:U.S.@[0]\n",
      "   3   3   0   0  | NN->NNP if Pos:IN@[-1] & Word:October@[0]\n"
     ]
    }
   ],
   "source": [
    "# Changing max_rules (here 100 instead of 10) can improve tagging accuracy.\n",
    "# min_acc=0.99 additionally sets a minimum accuracy for the learned rules.\n",
    "tagger2 = tt.train(\n",
    "    training_data,\n",
    "    max_rules=100,\n",
    "    min_acc=0.99,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 250,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.5616605616605617"
      ]
     },
     "execution_count": 250,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "tagger2.evaluate(gold_data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.6.1"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
